In [1]:
import torch

In [2]:
from vae import test_nll_estimation, parse_arguments

In [3]:
from pathlib import Path

In [4]:
# Evaluation settings; get_approx_nlls forwards every entry as a keyword
# argument to test_nll_estimation.
args = {
    'data_path': '../Data/Dataset',
    # Select 'cuda' when PyTorch reports an available CUDA device, else 'cpu'.
    'device': 'cuda' if torch.cuda.is_available() else 'cpu',
    'embedding_size': 300,
    'hidden_size': 256,
    'latent_size': 16,
    'num_layers': 1,
    'word_dropout': 1.0,
    'freebits': None,
    'model_save_path': 'models',
    'batch_size_valid': 64,
    'num_samples': 10,
}

In [5]:
def get_approx_nlls(saved_model_files):
    """Run ``test_nll_estimation`` on each saved model and collect the results.

    Every call receives the checkpoint path as ``saved_model_file`` together
    with all entries of the module-level ``args`` dict as keyword arguments.

    Args:
        saved_model_files: iterable of saved-model paths to evaluate.

    Returns:
        A ``(nlls, kls)`` pair of lists, each holding one value per input
        path, in input order. The two values come straight from the
        ``(nll, kl)`` pair returned by ``test_nll_estimation``.
    """
    def evaluate(checkpoint):
        # Unpack immediately so a malformed result fails on the offending checkpoint.
        nll, kl = test_nll_estimation(saved_model_file=checkpoint, **args)
        return nll, kl

    estimates = [evaluate(checkpoint) for checkpoint in saved_model_files]
    nlls = [nll for nll, _ in estimates]
    kls = [kl for _, kl in estimates]
    return nlls, kls

In [6]:
def get_model_filenames(experiment_name='vanilla', results_root='results_final', num_runs=4):
    """Collect one saved-model path per run directory for an experiment.

    For each ``i`` in ``range(num_runs)`` the directory
    ``{results_root}/results{i}/{experiment_name}/models/`` is inspected and
    the entry that sorts first by path is selected.

    Args:
        experiment_name: sub-directory name of the experiment inside each run.
        results_root: directory containing the ``results{i}`` run folders.
        num_runs: number of run folders to visit, starting at ``results0``.

    Returns:
        List of ``num_runs`` path strings, ordered by run index.

    Raises:
        FileNotFoundError: if a models directory does not exist (raised by
            ``iterdir``) or exists but contains no entries.
    """
    saved_model_files = []
    for i in range(num_runs):
        models_dir = Path(f"{results_root}/results{i}/{experiment_name}/models/")
        # iterdir() yields entries in arbitrary order; taking the minimum makes
        # the selected checkpoint reproducible when several files are present.
        first_entry = min(models_dir.iterdir(), default=None)
        if first_entry is None:
            # Explicit error instead of the bare StopIteration that next() would raise.
            raise FileNotFoundError(f"No saved model found in {models_dir}")
        saved_model_files.append(str(first_entry))
    return saved_model_files

In [7]:
# NOTE(review): the same value is also stored as args['num_samples']; this
# standalone variable is not read by any cell visible here — confirm it is
# still needed.
num_samples = 10

# Vanilla NLL

In [8]:
# Look up one saved model per run for the 'vanilla' experiment and display the paths.
saved_model_files = get_model_filenames('vanilla')
saved_model_files

['results_final/results0/vanilla/models/sentence_vae_3500.pt',
 'results_final/results1/vanilla/models/sentence_vae_3500.pt',
 'results_final/results2/vanilla/models/sentence_vae_3500.pt',
 'results_final/results3/vanilla/models/sentence_vae_3500.pt']

In [9]:
# Evaluate each vanilla checkpoint; get_approx_nlls returns one list of nll
# values and one list of kl values, aligned with saved_model_files.
vanilla_nlls, vanilla_kls = get_approx_nlls(saved_model_files)

  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .44it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .44it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .44it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 20%|██        | 2/10 [00:00<00:00, 17.44it/s][A
 50%|█████     | 5/10 [00:00<00:00, 19.30it/s][A

nll mean: 117.36602783203125 	 kl mean: 0.04554252326488495 	 loss mean: 117.41157531738281
nll mean: 117.49462890625 	 kl mean: 0.04554252326488495 	 loss mean: 117.54017639160156
nll mean: 117.374267578125 	 kl mean: 0.04554252326488495 	 loss mean: 117.41981506347656
nll mean: 117.51228332519531 	 kl mean: 0.04554252326488495 	 loss mean: 117.55781555175781
nll mean: 117.468994140625 	 kl mean: 0.04554252326488495 	 loss mean: 117.51454162597656


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .30it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .30it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 50%|█████     | 5/10 [00:00<00:00, 19.30it/s][A
                                      .86it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .86it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 23.49it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.43952178955078 	 kl mean: 0.04554252326488495 	 loss mean: 117.48506927490234
nll mean: 117.55322265625 	 kl mean: 0.04554252326488495 	 loss mean: 117.59877014160156
nll mean: 117.46664428710938 	 kl mean: 0.04554252326488495 	 loss mean: 117.51219177246094
nll mean: 117.52050018310547 	 kl mean: 0.04554252326488495 	 loss mean: 117.5660400390625
nll mean: 117.46519470214844 	 kl mean: 0.04554252326488495 	 loss mean: 117.51072692871094


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
 20%|██        | 2/10 [00:00<00:00, 15.63it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.58it/s][A

nll mean: 132.68283081054688 	 kl mean: 0.052283305674791336 	 loss mean: 132.735107421875
nll mean: 132.75253295898438 	 kl mean: 0.052283305674791336 	 loss mean: 132.80484008789062
nll mean: 132.7010955810547 	 kl mean: 0.052283305674791336 	 loss mean: 132.7533721923828
nll mean: 132.7313232421875 	 kl mean: 0.052283305674791336 	 loss mean: 132.78363037109375


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
 40%|████      | 4/10 [00:00<00:00, 15.58it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.68it/s][A

nll mean: 132.6934356689453 	 kl mean: 0.052283305674791336 	 loss mean: 132.7457275390625
nll mean: 132.7171173095703 	 kl mean: 0.052283305674791336 	 loss mean: 132.76939392089844
nll mean: 132.75668334960938 	 kl mean: 0.052283305674791336 	 loss mean: 132.80897521972656


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.68it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.34it/s]
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.34it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.34it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.27it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.6312713623047 	 kl mean: 0.052283305674791336 	 loss mean: 132.6835479736328
nll mean: 132.6751251220703 	 kl mean: 0.052283305674791336 	 loss mean: 132.7274169921875
nll mean: 132.66717529296875 	 kl mean: 0.052283305674791336 	 loss mean: 132.719482421875
nll mean: 104.59174346923828 	 kl mean: 0.052214737981557846 	 loss mean: 104.64395141601562


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 26.87it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.77it/s][A

nll mean: 104.52933502197266 	 kl mean: 0.052214737981557846 	 loss mean: 104.58155059814453
nll mean: 104.57830810546875 	 kl mean: 0.052214737981557846 	 loss mean: 104.63052368164062
nll mean: 104.56492614746094 	 kl mean: 0.052214737981557846 	 loss mean: 104.61714172363281
nll mean: 104.5521240234375 	 kl mean: 0.052214737981557846 	 loss mean: 104.60433959960938
nll mean: 104.54399108886719 	 kl mean: 0.052214737981557846 	 loss mean: 104.59620666503906
nll mean: 104.49931335449219 	 kl mean: 0.052214737981557846 	 loss mean: 104.55152893066406


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.77it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 26.35it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.53692626953125 	 kl mean: 0.052214737981557846 	 loss mean: 104.58914184570312
nll mean: 104.51988220214844 	 kl mean: 0.052214737981557846 	 loss mean: 104.57209014892578
nll mean: 104.54942321777344 	 kl mean: 0.052214737981557846 	 loss mean: 104.60162353515625
nll mean: 144.59872436523438 	 kl mean: 0.05813896656036377 	 loss mean: 144.6568603515625


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
 20%|██        | 2/10 [00:00<00:00, 11.19it/s][A
 40%|████      | 4/10 [00:00<00:00, 11.24it/s][A

nll mean: 144.66683959960938 	 kl mean: 0.05813896656036377 	 loss mean: 144.7249755859375
nll mean: 144.69651794433594 	 kl mean: 0.05813896656036377 	 loss mean: 144.75466918945312
nll mean: 144.65924072265625 	 kl mean: 0.05813896656036377 	 loss mean: 144.71737670898438


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.16it/s]
 40%|████      | 4/10 [00:00<00:00, 11.24it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.16it/s]
 60%|██████    | 6/10 [00:00<00:00, 11.32it/s][A

nll mean: 144.67593383789062 	 kl mean: 0.05813896656036377 	 loss mean: 144.7340545654297
nll mean: 144.62847900390625 	 kl mean: 0.05813896656036377 	 loss mean: 144.68663024902344
nll mean: 144.6461181640625 	 kl mean: 0.05813896656036377 	 loss mean: 144.70425415039062


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.16it/s]
 60%|██████    | 6/10 [00:00<00:00, 11.32it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.16it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.16it/s]
 80%|████████  | 8/10 [00:00<00:00, 11.33it/s][A
100%|██████████| 10/10 [00:00<00:00, 11.35it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.68714904785156 	 kl mean: 0.05813896656036377 	 loss mean: 144.7452850341797
nll mean: 144.71377563476562 	 kl mean: 0.05813896656036377 	 loss mean: 144.77191162109375
nll mean: 144.57373046875 	 kl mean: 0.05813896656036377 	 loss mean: 144.63186645507812


                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 14.51it/s][A

nll mean: 130.7947540283203 	 kl mean: 0.04776104912161827 	 loss mean: 130.84251403808594
nll mean: 130.77017211914062 	 kl mean: 0.04776104912161827 	 loss mean: 130.81793212890625
nll mean: 130.68553161621094 	 kl mean: 0.04776104912161827 	 loss mean: 130.73330688476562


                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 14.51it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
 40%|████      | 4/10 [00:00<00:00, 14.49it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]


nll mean: 130.77200317382812 	 kl mean: 0.04776104912161827 	 loss mean: 130.81976318359375
nll mean: 130.6614532470703 	 kl mean: 0.04776104912161827 	 loss mean: 130.709228515625
nll mean: 130.90647888183594 	 kl mean: 0.04776104912161827 	 loss mean: 130.95425415039062
nll mean: 130.85186767578125 	 kl mean: 0.04776104912161827 	 loss mean: 130.89962768554688


                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.62it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.70it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.85it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.02it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.70968627929688 	 kl mean: 0.04776104912161827 	 loss mean: 130.75746154785156
nll mean: 130.70404052734375 	 kl mean: 0.04776104912161827 	 loss mean: 130.75180053710938
nll mean: 130.76333618164062 	 kl mean: 0.04776104912161827 	 loss mean: 130.81109619140625
nll mean: 129.9357147216797 	 kl mean: 0.04873138666152954 	 loss mean: 129.98443603515625


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.72it/s][A
                                              [A


nll mean: 129.9810791015625 	 kl mean: 0.04873138666152954 	 loss mean: 130.02980041503906
nll mean: 130.01971435546875 	 kl mean: 0.04873138666152954 	 loss mean: 130.06845092773438
nll mean: 129.91119384765625 	 kl mean: 0.04873138666152954 	 loss mean: 129.95993041992188


 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.82it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
                                              [A
[A                                           

nll mean: 130.01866149902344 	 kl mean: 0.04873138666152954 	 loss mean: 130.06741333007812
nll mean: 129.896484375 	 kl mean: 0.04873138666152954 	 loss mean: 129.94522094726562
nll mean: 129.99554443359375 	 kl mean: 0.04873138666152954 	 loss mean: 130.0442657470703


 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.89it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.74it/s][A
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 26.64it/s][A

nll mean: 129.99417114257812 	 kl mean: 0.04873138666152954 	 loss mean: 130.04290771484375
nll mean: 129.98007202148438 	 kl mean: 0.04873138666152954 	 loss mean: 130.02879333496094
nll mean: 129.85360717773438 	 kl mean: 0.04873138666152954 	 loss mean: 129.90232849121094
nll mean: 139.28872680664062 	 kl mean: 0.0448867566883564 	 loss mean: 139.3336181640625
nll mean: 139.3621826171875 	 kl mean: 0.0448867566883564 	 loss mean: 139.4070587158203
nll mean: 139.1987762451172 	 kl mean: 0.0448867566883564 	 loss mean: 139.24366760253906


                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              [A
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              [A
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
 30%|███       | 3/10 [00:00<00:00, 26.64it/s][A
                                              [A
 16%|█▌        | 6/38 [00:03<00:20,  1.58it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.58it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.53it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 26.26it/s][A

nll mean: 139.23745727539062 	 kl mean: 0.0448867566883564 	 loss mean: 139.2823486328125
nll mean: 139.3018035888672 	 kl mean: 0.0448867566883564 	 loss mean: 139.34669494628906
nll mean: 139.31930541992188 	 kl mean: 0.0448867566883564 	 loss mean: 139.36419677734375
nll mean: 139.28538513183594 	 kl mean: 0.0448867566883564 	 loss mean: 139.3302764892578
nll mean: 139.29156494140625 	 kl mean: 0.0448867566883564 	 loss mean: 139.3364715576172
nll mean: 139.2534637451172 	 kl mean: 0.0448867566883564 	 loss mean: 139.29837036132812


                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.58it/s]
100%|██████████| 10/10 [00:00<00:00, 26.07it/s][A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
 30%|███       | 3/10 [00:00<00:00, 25.78it/s][A

nll mean: 139.29823303222656 	 kl mean: 0.0448867566883564 	 loss mean: 139.34310913085938
nll mean: 111.09657287597656 	 kl mean: 0.05411272495985031 	 loss mean: 111.15068054199219
nll mean: 111.0618896484375 	 kl mean: 0.05411272495985031 	 loss mean: 111.11599731445312
nll mean: 111.14808654785156 	 kl mean: 0.05411272495985031 	 loss mean: 111.20219421386719
nll mean: 111.1703109741211 	 kl mean: 0.05411272495985031 	 loss mean: 111.22442626953125
nll mean: 111.0794677734375 	 kl mean: 0.05411272495985031 	 loss mean: 111.13357543945312


                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
 30%|███       | 3/10 [00:00<00:00, 25.78it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.76it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.79it/s]
100%|██████████| 10/10 [00:00<00:00, 25.78it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.06005859375 	 kl mean: 0.05411272495985031 	 loss mean: 111.11418151855469
nll mean: 111.15242004394531 	 kl mean: 0.05411272495985031 	 loss mean: 111.20652770996094
nll mean: 111.16270446777344 	 kl mean: 0.05411272495985031 	 loss mean: 111.2168197631836
nll mean: 111.14386749267578 	 kl mean: 0.05411272495985031 	 loss mean: 111.19798278808594
nll mean: 111.11915588378906 	 kl mean: 0.05411272495985031 	 loss mean: 111.17327880859375


                                              
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
 20%|██        | 2/10 [00:00<00:00, 16.14it/s][A
 40%|████      | 4/10 [00:00<00:00, 16.13it/s][A

nll mean: 137.30519104003906 	 kl mean: 0.047870535403490067 	 loss mean: 137.35305786132812
nll mean: 137.3903350830078 	 kl mean: 0.047870535403490067 	 loss mean: 137.43820190429688
nll mean: 137.34429931640625 	 kl mean: 0.047870535403490067 	 loss mean: 137.3921661376953
nll mean: 137.32688903808594 	 kl mean: 0.047870535403490067 	 loss mean: 137.374755859375


                                              
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
 40%|████      | 4/10 [00:00<00:00, 16.13it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.97it/s]
 60%|██████    | 6/10 [00:00<00:00, 16.09it/s][A
 80%|████████  | 8/10 [00:00<00:00, 16.23it/s][A

nll mean: 137.3830108642578 	 kl mean: 0.047870535403490067 	 loss mean: 137.43087768554688
nll mean: 137.37254333496094 	 kl mean: 0.047870535403490067 	 loss mean: 137.42041015625
nll mean: 137.39349365234375 	 kl mean: 0.047870535403490067 	 loss mean: 137.44134521484375
nll mean: 137.25135803222656 	 kl mean: 0.047870535403490067 	 loss mean: 137.29922485351562


                                              
 21%|██        | 8/38 [00:05<00:15,  1.97it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.97it/s]
 80%|████████  | 8/10 [00:00<00:00, 16.23it/s][A
100%|██████████| 10/10 [00:00<00:00, 16.14it/s][A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]


nll mean: 137.31344604492188 	 kl mean: 0.047870535403490067 	 loss mean: 137.36129760742188
nll mean: 137.3468475341797 	 kl mean: 0.047870535403490067 	 loss mean: 137.39471435546875
nll mean: 137.68832397460938 	 kl mean: 0.0455901175737381 	 loss mean: 137.73391723632812
nll mean: 137.76922607421875 	 kl mean: 0.0455901175737381 	 loss mean: 137.81478881835938
nll mean: 137.7592315673828 	 kl mean: 0.0455901175737381 	 loss mean: 137.80482482910156


  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 22.55it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A

nll mean: 137.75552368164062 	 kl mean: 0.0455901175737381 	 loss mean: 137.80111694335938
nll mean: 137.76759338378906 	 kl mean: 0.0455901175737381 	 loss mean: 137.8131866455078
nll mean: 137.79519653320312 	 kl mean: 0.0455901175737381 	 loss mean: 137.8407745361328
nll mean: 137.69810485839844 	 kl mean: 0.0455901175737381 	 loss mean: 137.7436981201172
nll mean: 137.77767944335938 	 kl mean: 0.0455901175737381 	 loss mean: 137.82327270507812


                                              
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:15,  1.84it/s]
100%|██████████| 10/10 [00:00<00:00, 22.60it/s][A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A


nll mean: 137.82003784179688 	 kl mean: 0.0455901175737381 	 loss mean: 137.86561584472656
nll mean: 137.77145385742188 	 kl mean: 0.0455901175737381 	 loss mean: 137.81704711914062
nll mean: 124.17491912841797 	 kl mean: 0.04020965099334717 	 loss mean: 124.21512603759766
nll mean: 124.0265884399414 	 kl mean: 0.04020965099334717 	 loss mean: 124.06678771972656
nll mean: 124.09330749511719 	 kl mean: 0.04020965099334717 	 loss mean: 124.13351440429688


 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
 30%|███       | 3/10 [00:00<00:00, 25.84it/s][A
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.71it/s][A

nll mean: 124.22457885742188 	 kl mean: 0.04020965099334717 	 loss mean: 124.26478576660156
nll mean: 124.07648468017578 	 kl mean: 0.04020965099334717 	 loss mean: 124.11669921875
nll mean: 124.10625457763672 	 kl mean: 0.04020965099334717 	 loss mean: 124.14646911621094
nll mean: 124.04193878173828 	 kl mean: 0.04020965099334717 	 loss mean: 124.08213806152344
nll mean: 124.01429748535156 	 kl mean: 0.04020965099334717 	 loss mean: 124.05450439453125
nll mean: 124.04731750488281 	 kl mean: 0.04020965099334717 	 loss mean: 124.0875244140625


                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.95it/s]
100%|██████████| 10/10 [00:00<00:00, 25.61it/s][A
 29%|██▉       | 11/38 [00:05<00:12,  2.10it/s]
                                               
 29%|██▉       | 11/38 [00:05<00:12,  2.10it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
 30%|███       | 3/10 [00:00<00:00, 23.26it/s][A

nll mean: 124.08744812011719 	 kl mean: 0.04020965099334717 	 loss mean: 124.12765502929688
nll mean: 146.88949584960938 	 kl mean: 0.043540000915527344 	 loss mean: 146.93304443359375
nll mean: 146.8841094970703 	 kl mean: 0.043540000915527344 	 loss mean: 146.9276580810547
nll mean: 146.91094970703125 	 kl mean: 0.043540000915527344 	 loss mean: 146.95448303222656
nll mean: 146.86026000976562 	 kl mean: 0.043540000915527344 	 loss mean: 146.90380859375


                                               
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
 30%|███       | 3/10 [00:00<00:00, 23.26it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.73it/s][A

nll mean: 146.91876220703125 	 kl mean: 0.043540000915527344 	 loss mean: 146.96231079101562
nll mean: 146.873291015625 	 kl mean: 0.043540000915527344 	 loss mean: 146.91683959960938
nll mean: 146.98089599609375 	 kl mean: 0.043540000915527344 	 loss mean: 147.02444458007812
nll mean: 146.8612060546875 	 kl mean: 0.043540000915527344 	 loss mean: 146.90475463867188
nll mean: 146.91207885742188 	 kl mean: 0.043540000915527344 	 loss mean: 146.95562744140625


                                               
 29%|██▉       | 11/38 [00:06<00:12,  2.10it/s]
100%|██████████| 10/10 [00:00<00:00, 22.42it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.06it/s][A

nll mean: 146.95425415039062 	 kl mean: 0.043540000915527344 	 loss mean: 146.997802734375
nll mean: 123.82749938964844 	 kl mean: 0.04781860113143921 	 loss mean: 123.87532043457031
nll mean: 123.82063293457031 	 kl mean: 0.04781860113143921 	 loss mean: 123.86844635009766


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
 20%|██        | 2/10 [00:00<00:00, 13.06it/s][A
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
 40%|████      | 4/10 [00:00<00:00, 13.23it/s][A

nll mean: 123.77784729003906 	 kl mean: 0.04781860113143921 	 loss mean: 123.8256607055664
nll mean: 123.72196960449219 	 kl mean: 0.04781860113143921 	 loss mean: 123.76979064941406
nll mean: 123.7952880859375 	 kl mean: 0.04781860113143921 	 loss mean: 123.84310150146484


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
 40%|████      | 4/10 [00:00<00:00, 13.23it/s][A
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.13it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.27it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.28it/s][A

nll mean: 123.79435729980469 	 kl mean: 0.04781860113143921 	 loss mean: 123.84217834472656
nll mean: 123.78305053710938 	 kl mean: 0.04781860113143921 	 loss mean: 123.83087158203125
nll mean: 123.81221008300781 	 kl mean: 0.04781860113143921 	 loss mean: 123.86002349853516


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.13it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.13it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.28it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.26it/s][A
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.75711059570312 	 kl mean: 0.04781860113143921 	 loss mean: 123.804931640625
nll mean: 123.85856628417969 	 kl mean: 0.04781860113143921 	 loss mean: 123.90637969970703
nll mean: 167.9478759765625 	 kl mean: 0.05177302658557892 	 loss mean: 167.9996337890625


                                               
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
 20%|██        | 2/10 [00:00<00:00, 10.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.55it/s][A

nll mean: 168.08328247070312 	 kl mean: 0.05177302658557892 	 loss mean: 168.13507080078125
nll mean: 167.97842407226562 	 kl mean: 0.05177302658557892 	 loss mean: 168.0301971435547
nll mean: 168.04464721679688 	 kl mean: 0.05177302658557892 	 loss mean: 168.09642028808594


                                               
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
 40%|████      | 4/10 [00:00<00:00, 10.55it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.46it/s][A

nll mean: 168.08670043945312 	 kl mean: 0.05177302658557892 	 loss mean: 168.1384735107422
nll mean: 168.00778198242188 	 kl mean: 0.05177302658557892 	 loss mean: 168.05955505371094
nll mean: 168.0308837890625 	 kl mean: 0.05177302658557892 	 loss mean: 168.08267211914062


                                               
 34%|███▍      | 13/38 [00:07<00:13,  1.80it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.46it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:13,  1.80it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:13,  1.80it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.34it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 168.12356567382812 	 kl mean: 0.05177302658557892 	 loss mean: 168.17535400390625
nll mean: 168.0430908203125 	 kl mean: 0.05177302658557892 	 loss mean: 168.09487915039062
nll mean: 168.0677490234375 	 kl mean: 0.05177302658557892 	 loss mean: 168.1195068359375


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 19.33it/s][A
 40%|████      | 4/10 [00:00<00:00, 19.03it/s][A

nll mean: 139.85110473632812 	 kl mean: 0.05442781746387482 	 loss mean: 139.90554809570312
nll mean: 139.85340881347656 	 kl mean: 0.05442781746387482 	 loss mean: 139.9078369140625
nll mean: 139.84906005859375 	 kl mean: 0.05442781746387482 	 loss mean: 139.90350341796875
nll mean: 139.8603515625 	 kl mean: 0.05442781746387482 	 loss mean: 139.91476440429688


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 19.03it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.85it/s][A

nll mean: 139.89077758789062 	 kl mean: 0.05442781746387482 	 loss mean: 139.94522094726562
nll mean: 139.89102172851562 	 kl mean: 0.05442781746387482 	 loss mean: 139.94546508789062
nll mean: 139.80401611328125 	 kl mean: 0.05442781746387482 	 loss mean: 139.8584442138672
nll mean: 139.95733642578125 	 kl mean: 0.05442781746387482 	 loss mean: 140.01177978515625


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.85it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.70it/s][A
 39%|███▉      | 15/38 [00:08<00:14,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.85205078125 	 kl mean: 0.05442781746387482 	 loss mean: 139.90647888183594
nll mean: 139.83084106445312 	 kl mean: 0.05442781746387482 	 loss mean: 139.88528442382812


                                               
 39%|███▉      | 15/38 [00:08<00:14,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:08<00:14,  1.57it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
 10%|█         | 1/10 [00:00<00:01,  5.73it/s][A
 30%|███       | 3/10 [00:00<00:01,  6.70it/s][A

nll mean: 148.16128540039062 	 kl mean: 0.04723987728357315 	 loss mean: 148.20852661132812
nll mean: 148.16360473632812 	 kl mean: 0.04723987728357315 	 loss mean: 148.21084594726562
nll mean: 148.12545776367188 	 kl mean: 0.04723987728357315 	 loss mean: 148.17269897460938


                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
 30%|███       | 3/10 [00:00<00:01,  6.70it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
 50%|█████     | 5/10 [00:00<00:00,  7.63it/s][A

nll mean: 148.12660217285156 	 kl mean: 0.04723987728357315 	 loss mean: 148.173828125
nll mean: 148.09280395507812 	 kl mean: 0.04723987728357315 	 loss mean: 148.14004516601562
nll mean: 148.0509033203125 	 kl mean: 0.04723987728357315 	 loss mean: 148.09815979003906


                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
 50%|█████     | 5/10 [00:00<00:00,  7.63it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
 70%|███████   | 7/10 [00:00<00:00,  8.35it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.02it/s][A

nll mean: 148.1097869873047 	 kl mean: 0.04723987728357315 	 loss mean: 148.1570281982422
nll mean: 148.12783813476562 	 kl mean: 0.04723987728357315 	 loss mean: 148.17507934570312
nll mean: 148.10055541992188 	 kl mean: 0.04723987728357315 	 loss mean: 148.1477813720703


                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.57it/s]
100%|██████████| 10/10 [00:00<00:00, 10.12it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 25.46it/s][A

nll mean: 148.11546325683594 	 kl mean: 0.04723987728357315 	 loss mean: 148.16270446777344
nll mean: 150.4879913330078 	 kl mean: 0.05448995903134346 	 loss mean: 150.54248046875
nll mean: 150.40109252929688 	 kl mean: 0.05448995903134346 	 loss mean: 150.45559692382812
nll mean: 150.446533203125 	 kl mean: 0.05448995903134346 	 loss mean: 150.5010223388672
nll mean: 150.3585662841797 	 kl mean: 0.05448995903134346 	 loss mean: 150.41305541992188


                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 25.46it/s][A
                                               [A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.20it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
100%|██████████| 10/10 [00:00<00:00, 25.12it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]

nll mean: 150.48992919921875 	 kl mean: 0.05448995903134346 	 loss mean: 150.54443359375
nll mean: 150.46929931640625 	 kl mean: 0.05448995903134346 	 loss mean: 150.5238037109375
nll mean: 150.40951538085938 	 kl mean: 0.05448995903134346 	 loss mean: 150.46401977539062
nll mean: 150.37576293945312 	 kl mean: 0.05448995903134346 	 loss mean: 150.43023681640625
nll mean: 150.4910125732422 	 kl mean: 0.05448995903134346 	 loss mean: 150.54550170898438
nll mean: 150.41995239257812 	 kl mean: 0.05448995903134346 	 loss mean: 150.4744415283203



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 30%|███       | 3/10 [00:00<00:00, 25.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.80it/s][A

nll mean: 139.6370849609375 	 kl mean: 0.048931967467069626 	 loss mean: 139.68600463867188
nll mean: 139.59637451171875 	 kl mean: 0.048931967467069626 	 loss mean: 139.64532470703125
nll mean: 139.5876007080078 	 kl mean: 0.048931967467069626 	 loss mean: 139.63653564453125
nll mean: 139.59042358398438 	 kl mean: 0.048931967467069626 	 loss mean: 139.6393585205078
nll mean: 139.59445190429688 	 kl mean: 0.048931967467069626 	 loss mean: 139.6433868408203
nll mean: 139.6038818359375 	 kl mean: 0.048931967467069626 	 loss mean: 139.65281677246094


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.80it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
100%|██████████| 10/10 [00:00<00:00, 25.75it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.6312255859375 	 kl mean: 0.048931967467069626 	 loss mean: 139.68016052246094
nll mean: 139.63644409179688 	 kl mean: 0.048931967467069626 	 loss mean: 139.68536376953125
nll mean: 139.625 	 kl mean: 0.048931967467069626 	 loss mean: 139.67391967773438
nll mean: 139.71087646484375 	 kl mean: 0.048931967467069626 	 loss mean: 139.7598114013672
nll mean: 136.82411193847656 	 kl mean: 0.048692379146814346 	 loss mean: 136.87281799316406


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
                                               [A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
 20%|██        | 2/10 [00:00<00:00, 13.16it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.17it/s][A

nll mean: 136.73731994628906 	 kl mean: 0.048692379146814346 	 loss mean: 136.7860107421875
nll mean: 136.7637939453125 	 kl mean: 0.048692379146814346 	 loss mean: 136.8125
nll mean: 136.7889404296875 	 kl mean: 0.048692379146814346 	 loss mean: 136.837646484375


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
                                               [A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
 40%|████      | 4/10 [00:00<00:00, 13.17it/s][A
                                               [A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.14it/s][A

nll mean: 136.80453491210938 	 kl mean: 0.048692379146814346 	 loss mean: 136.85321044921875
nll mean: 136.7576141357422 	 kl mean: 0.048692379146814346 	 loss mean: 136.80630493164062
nll mean: 136.7556915283203 	 kl mean: 0.048692379146814346 	 loss mean: 136.80438232421875


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.14it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.22it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.19it/s][A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.80108642578125 	 kl mean: 0.048692379146814346 	 loss mean: 136.84979248046875
nll mean: 136.7452850341797 	 kl mean: 0.048692379146814346 	 loss mean: 136.79397583007812
nll mean: 136.76661682128906 	 kl mean: 0.048692379146814346 	 loss mean: 136.8153076171875


                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 13.16it/s][A

nll mean: 154.3721923828125 	 kl mean: 0.04129062592983246 	 loss mean: 154.41348266601562
nll mean: 154.35366821289062 	 kl mean: 0.04129062592983246 	 loss mean: 154.39495849609375
nll mean: 154.38937377929688 	 kl mean: 0.04129062592983246 	 loss mean: 154.4306640625


                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 13.16it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 40%|████      | 4/10 [00:00<00:00, 12.97it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.75it/s][A

nll mean: 154.42678833007812 	 kl mean: 0.04129062592983246 	 loss mean: 154.46807861328125
nll mean: 154.37841796875 	 kl mean: 0.04129062592983246 	 loss mean: 154.41970825195312
nll mean: 154.41189575195312 	 kl mean: 0.04129062592983246 	 loss mean: 154.45318603515625


                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.75it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.66it/s][A

nll mean: 154.40228271484375 	 kl mean: 0.04129062592983246 	 loss mean: 154.44358825683594
nll mean: 154.48602294921875 	 kl mean: 0.04129062592983246 	 loss mean: 154.52731323242188
nll mean: 154.3665313720703 	 kl mean: 0.04129062592983246 	 loss mean: 154.40782165527344


                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.64it/s][A
 53%|█████▎    | 20/38 [00:11<00:12,  1.48it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.45it/s][A

nll mean: 154.3819580078125 	 kl mean: 0.04129062592983246 	 loss mean: 154.4232635498047
nll mean: 162.278076171875 	 kl mean: 0.051538869738578796 	 loss mean: 162.32962036132812
nll mean: 162.4276123046875 	 kl mean: 0.051538869738578796 	 loss mean: 162.4791717529297


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 13.45it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 13.27it/s][A

nll mean: 162.36317443847656 	 kl mean: 0.051538869738578796 	 loss mean: 162.4147186279297
nll mean: 162.39633178710938 	 kl mean: 0.051538869738578796 	 loss mean: 162.4478759765625
nll mean: 162.3719940185547 	 kl mean: 0.051538869738578796 	 loss mean: 162.4235382080078


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 13.27it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.29it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.13it/s][A

nll mean: 162.45901489257812 	 kl mean: 0.051538869738578796 	 loss mean: 162.51055908203125
nll mean: 162.35365295410156 	 kl mean: 0.051538869738578796 	 loss mean: 162.4051971435547
nll mean: 162.34422302246094 	 kl mean: 0.051538869738578796 	 loss mean: 162.39576721191406


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.08it/s][A
 55%|█████▌    | 21/38 [00:12<00:11,  1.42it/s]
                                               
 55%|█████▌    | 21/38 [00:12<00:11,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 162.36073303222656 	 kl mean: 0.051538869738578796 	 loss mean: 162.4122772216797
nll mean: 162.3109130859375 	 kl mean: 0.051538869738578796 	 loss mean: 162.36244201660156
nll mean: 122.99360656738281 	 kl mean: 0.050619229674339294 	 loss mean: 123.04422760009766


                                               
 55%|█████▌    | 21/38 [00:12<00:11,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 20%|██        | 2/10 [00:00<00:00, 10.61it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.64it/s][A

nll mean: 122.94168090820312 	 kl mean: 0.050619229674339294 	 loss mean: 122.9923095703125
nll mean: 123.08374786376953 	 kl mean: 0.050619229674339294 	 loss mean: 123.13436889648438
nll mean: 123.02388000488281 	 kl mean: 0.050619229674339294 	 loss mean: 123.07449340820312


                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 40%|████      | 4/10 [00:00<00:00, 10.64it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.42it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.41it/s][A

nll mean: 123.08302307128906 	 kl mean: 0.050619229674339294 	 loss mean: 123.13363647460938
nll mean: 123.00570678710938 	 kl mean: 0.050619229674339294 	 loss mean: 123.05632781982422
nll mean: 123.02096557617188 	 kl mean: 0.050619229674339294 	 loss mean: 123.07159423828125


                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.41it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
100%|██████████| 10/10 [00:00<00:00, 10.45it/s][A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.01097869873047 	 kl mean: 0.050619229674339294 	 loss mean: 123.06159210205078
nll mean: 123.10337829589844 	 kl mean: 0.050619229674339294 	 loss mean: 123.15399932861328
nll mean: 122.98094177246094 	 kl mean: 0.050619229674339294 	 loss mean: 123.03156280517578


                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
 40%|████      | 4/10 [00:00<00:00, 33.99it/s][A

nll mean: 111.08336639404297 	 kl mean: 0.03705066442489624 	 loss mean: 111.12041473388672
nll mean: 111.16178894042969 	 kl mean: 0.03705066442489624 	 loss mean: 111.19883728027344
nll mean: 111.05941772460938 	 kl mean: 0.03705066442489624 	 loss mean: 111.09646606445312
nll mean: 111.07101440429688 	 kl mean: 0.03705066442489624 	 loss mean: 111.10807037353516
nll mean: 111.06932067871094 	 kl mean: 0.03705066442489624 	 loss mean: 111.10637664794922
nll mean: 111.09368896484375 	 kl mean: 0.03705066442489624 	 loss mean: 111.1307373046875
nll mean: 111.0545654296875 	 kl mean: 0.03705066442489624 	 loss mean: 111.09161376953125


                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
 40%|████      | 4/10 [00:00<00:00, 33.99it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.28it/s]
100%|██████████| 10/10 [00:00<00:00, 33.64it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.92it/s][A

nll mean: 111.14800262451172 	 kl mean: 0.03705066442489624 	 loss mean: 111.18505859375
nll mean: 111.12077331542969 	 kl mean: 0.03705066442489624 	 loss mean: 111.15782165527344
nll mean: 111.08759307861328 	 kl mean: 0.03705066442489624 	 loss mean: 111.1246337890625
nll mean: 163.18692016601562 	 kl mean: 0.044066667556762695 	 loss mean: 163.2310028076172
nll mean: 163.27056884765625 	 kl mean: 0.044066667556762695 	 loss mean: 163.31463623046875


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.92it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 15.04it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.03it/s][A

nll mean: 163.1605682373047 	 kl mean: 0.044066667556762695 	 loss mean: 163.2046356201172
nll mean: 163.28250122070312 	 kl mean: 0.044066667556762695 	 loss mean: 163.32656860351562
nll mean: 163.2164306640625 	 kl mean: 0.044066667556762695 	 loss mean: 163.260498046875
nll mean: 163.20176696777344 	 kl mean: 0.044066667556762695 	 loss mean: 163.24583435058594


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.03it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.10it/s]

nll mean: 163.24337768554688 	 kl mean: 0.044066667556762695 	 loss mean: 163.28744506835938
nll mean: 163.23580932617188 	 kl mean: 0.044066667556762695 	 loss mean: 163.27987670898438
nll mean: 163.24322509765625 	 kl mean: 0.044066667556762695 	 loss mean: 163.28729248046875
nll mean: 163.31378173828125 	 kl mean: 0.044066667556762695 	 loss mean: 163.35784912109375


[A
100%|██████████| 10/10 [00:00<00:00, 15.06it/s][A
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
                                               [A
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 23.04it/s][A

nll mean: 126.6549072265625 	 kl mean: 0.05070033296942711 	 loss mean: 126.70560455322266
nll mean: 126.6418685913086 	 kl mean: 0.05070033296942711 	 loss mean: 126.69257354736328
nll mean: 126.67766571044922 	 kl mean: 0.05070033296942711 	 loss mean: 126.72836303710938
nll mean: 126.6008071899414 	 kl mean: 0.05070033296942711 	 loss mean: 126.65150451660156
nll mean: 126.66487121582031 	 kl mean: 0.05070033296942711 	 loss mean: 126.715576171875


                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 23.04it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:14<00:09,  1.55it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.55it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.85it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 22.58it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.61937713623047 	 kl mean: 0.05070033296942711 	 loss mean: 126.67007446289062
nll mean: 126.55254364013672 	 kl mean: 0.05070033296942711 	 loss mean: 126.60324096679688
nll mean: 126.62687683105469 	 kl mean: 0.05070033296942711 	 loss mean: 126.67758178710938
nll mean: 126.67495727539062 	 kl mean: 0.05070033296942711 	 loss mean: 126.72564697265625
nll mean: 126.6615982055664 	 kl mean: 0.05070033296942711 	 loss mean: 126.71229553222656


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 14.89it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A

nll mean: 120.85668182373047 	 kl mean: 0.04911566898226738 	 loss mean: 120.90580749511719
nll mean: 120.85855102539062 	 kl mean: 0.04911566898226738 	 loss mean: 120.90766906738281
nll mean: 120.93985748291016 	 kl mean: 0.04911566898226738 	 loss mean: 120.98896789550781
nll mean: 120.93240356445312 	 kl mean: 0.04911566898226738 	 loss mean: 120.98152923583984


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.97it/s][A
 80%|████████  | 8/10 [00:00<00:00, 15.09it/s][A

nll mean: 120.83667755126953 	 kl mean: 0.04911566898226738 	 loss mean: 120.88578796386719
nll mean: 120.86384582519531 	 kl mean: 0.04911566898226738 	 loss mean: 120.9129638671875
nll mean: 120.82939147949219 	 kl mean: 0.04911566898226738 	 loss mean: 120.87850952148438
nll mean: 120.93290710449219 	 kl mean: 0.04911566898226738 	 loss mean: 120.98202514648438


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.09it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.06it/s][A
 68%|██████▊   | 26/38 [00:15<00:07,  1.64it/s]
                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.64it/s]
                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.64it/s]
                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 24.52it/s][A

nll mean: 120.83952331542969 	 kl mean: 0.04911566898226738 	 loss mean: 120.8886489868164
nll mean: 120.87763977050781 	 kl mean: 0.04911566898226738 	 loss mean: 120.9267578125
nll mean: 87.38822937011719 	 kl mean: 0.06718866527080536 	 loss mean: 87.4554214477539
nll mean: 87.26229858398438 	 kl mean: 0.06718866527080536 	 loss mean: 87.32948303222656
nll mean: 87.23686218261719 	 kl mean: 0.06718866527080536 	 loss mean: 87.30404663085938


                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.64it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
 30%|███       | 3/10 [00:00<00:00, 24.52it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.93it/s][A

nll mean: 87.25776672363281 	 kl mean: 0.06718866527080536 	 loss mean: 87.32495880126953
nll mean: 87.29661560058594 	 kl mean: 0.06718866527080536 	 loss mean: 87.36380004882812
nll mean: 87.36997985839844 	 kl mean: 0.06718866527080536 	 loss mean: 87.43717193603516
nll mean: 87.30328369140625 	 kl mean: 0.06718866527080536 	 loss mean: 87.37046813964844
nll mean: 87.48463439941406 	 kl mean: 0.06718866527080536 	 loss mean: 87.55181884765625


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.93it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.64it/s]
100%|██████████| 10/10 [00:00<00:00, 23.64it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 22.78it/s][A

nll mean: 87.35078430175781 	 kl mean: 0.06718866527080536 	 loss mean: 87.41797637939453
nll mean: 87.26725769042969 	 kl mean: 0.06718866527080536 	 loss mean: 87.33444213867188
nll mean: 113.91921997070312 	 kl mean: 0.04064653813838959 	 loss mean: 113.95986938476562
nll mean: 113.87156677246094 	 kl mean: 0.04064653813838959 	 loss mean: 113.9122085571289
nll mean: 114.02363586425781 	 kl mean: 0.04064653813838959 	 loss mean: 114.06428527832031


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
 30%|███       | 3/10 [00:00<00:00, 22.78it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.88it/s][A

nll mean: 113.96073150634766 	 kl mean: 0.04064653813838959 	 loss mean: 114.00138092041016
nll mean: 113.9397201538086 	 kl mean: 0.04064653813838959 	 loss mean: 113.98036193847656
nll mean: 113.86056518554688 	 kl mean: 0.04064653813838959 	 loss mean: 113.90121459960938
nll mean: 113.9125747680664 	 kl mean: 0.04064653813838959 	 loss mean: 113.95321655273438
nll mean: 113.84732818603516 	 kl mean: 0.04064653813838959 	 loss mean: 113.88796997070312


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.88it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.80it/s]
100%|██████████| 10/10 [00:00<00:00, 22.81it/s][A
 74%|███████▎  | 28/38 [00:16<00:05,  1.92it/s]
                                               
 74%|███████▎  | 28/38 [00:16<00:05,  1.92it/s]
                                               

nll mean: 113.90592956542969 	 kl mean: 0.04064653813838959 	 loss mean: 113.94657897949219
nll mean: 113.93901824951172 	 kl mean: 0.04064653813838959 	 loss mean: 113.97966003417969
nll mean: 126.03528594970703 	 kl mean: 0.04468752071261406 	 loss mean: 126.0799789428711



 74%|███████▎  | 28/38 [00:16<00:05,  1.92it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:16<00:05,  1.92it/s]
                                               [A
 74%|███████▎  | 28/38 [00:16<00:05,  1.92it/s]
 20%|██        | 2/10 [00:00<00:00, 12.89it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.96it/s][A

nll mean: 126.02159118652344 	 kl mean: 0.04468752071261406 	 loss mean: 126.0662841796875
nll mean: 126.03189086914062 	 kl mean: 0.04468752071261406 	 loss mean: 126.07657623291016
nll mean: 126.00756072998047 	 kl mean: 0.04468752071261406 	 loss mean: 126.05224609375


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
 40%|████      | 4/10 [00:00<00:00, 12.96it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.04it/s][A

nll mean: 126.05352783203125 	 kl mean: 0.04468752071261406 	 loss mean: 126.09821319580078
nll mean: 126.00164031982422 	 kl mean: 0.04468752071261406 	 loss mean: 126.04633331298828
nll mean: 126.04566955566406 	 kl mean: 0.04468752071261406 	 loss mean: 126.0903549194336


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.04it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.92it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.96it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.01it/s][A
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.03955841064453 	 kl mean: 0.04468752071261406 	 loss mean: 126.08423614501953
nll mean: 125.98297882080078 	 kl mean: 0.04468752071261406 	 loss mean: 126.02766418457031
nll mean: 125.93392944335938 	 kl mean: 0.04468752071261406 	 loss mean: 125.97862243652344


                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
 20%|██        | 2/10 [00:00<00:00, 10.65it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.39it/s][A

nll mean: 66.85952758789062 	 kl mean: 0.04071469232439995 	 loss mean: 66.90023803710938
nll mean: 66.7532730102539 	 kl mean: 0.04071469232439995 	 loss mean: 66.79399108886719
nll mean: 66.79357147216797 	 kl mean: 0.04071469232439995 	 loss mean: 66.83428192138672


                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
                                               [A
 76%|███████▋  | 29/38 [00:17<00:05,  1.68it/s]
 30%|███       | 3/10 [00:00<00:00, 10.39it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.68it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.35it/s][A

nll mean: 66.76814270019531 	 kl mean: 0.04071469232439995 	 loss mean: 66.80885314941406
nll mean: 66.86251068115234 	 kl mean: 0.04071469232439995 	 loss mean: 66.90322875976562
nll mean: 66.72632598876953 	 kl mean: 0.04071469232439995 	 loss mean: 66.76704406738281


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.68it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.35it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.68it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.68it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.41it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.45it/s][A

nll mean: 66.83220672607422 	 kl mean: 0.04071469232439995 	 loss mean: 66.87291717529297
nll mean: 66.79132843017578 	 kl mean: 0.04071469232439995 	 loss mean: 66.83204650878906
nll mean: 66.78077697753906 	 kl mean: 0.04071469232439995 	 loss mean: 66.82150268554688


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.68it/s]
100%|██████████| 10/10 [00:00<00:00, 10.42it/s][A
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.39it/s][A

nll mean: 66.76252746582031 	 kl mean: 0.04071469232439995 	 loss mean: 66.8032455444336
nll mean: 110.1387710571289 	 kl mean: 0.053182847797870636 	 loss mean: 110.19195556640625
nll mean: 110.14713287353516 	 kl mean: 0.053182847797870636 	 loss mean: 110.2003173828125


                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
                                               [A
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
 20%|██        | 2/10 [00:00<00:00, 13.39it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
 40%|████      | 4/10 [00:00<00:00, 13.32it/s][A

nll mean: 110.18644714355469 	 kl mean: 0.053182847797870636 	 loss mean: 110.23963165283203
nll mean: 110.24948120117188 	 kl mean: 0.053182847797870636 	 loss mean: 110.30266571044922
nll mean: 110.218994140625 	 kl mean: 0.053182847797870636 	 loss mean: 110.27218627929688


                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
 40%|████      | 4/10 [00:00<00:00, 13.32it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
                                               [A
 79%|███████▉  | 30/38 [00:18<00:05,  1.42it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.22it/s][A

nll mean: 110.1269302368164 	 kl mean: 0.053182847797870636 	 loss mean: 110.18011474609375
nll mean: 110.15943145751953 	 kl mean: 0.053182847797870636 	 loss mean: 110.21261596679688
nll mean: 110.15855407714844 	 kl mean: 0.053182847797870636 	 loss mean: 110.21173095703125


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.42it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.42it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.22it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.19it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.20198822021484 	 kl mean: 0.053182847797870636 	 loss mean: 110.25517272949219
nll mean: 110.17737579345703 	 kl mean: 0.053182847797870636 	 loss mean: 110.23056030273438
nll mean: 142.90060424804688 	 kl mean: 0.05795404314994812 	 loss mean: 142.95855712890625


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
                                               [A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.63it/s][A

nll mean: 142.91737365722656 	 kl mean: 0.05795404314994812 	 loss mean: 142.975341796875
nll mean: 143.02847290039062 	 kl mean: 0.05795404314994812 	 loss mean: 143.08642578125
nll mean: 142.92129516601562 	 kl mean: 0.05795404314994812 	 loss mean: 142.979248046875



                                               [A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
                                               [A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 10.44it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.41it/s][A

nll mean: 143.0111541748047 	 kl mean: 0.05795404314994812 	 loss mean: 143.069091796875
nll mean: 142.98828125 	 kl mean: 0.05795404314994812 	 loss mean: 143.04623413085938
nll mean: 142.89666748046875 	 kl mean: 0.05795404314994812 	 loss mean: 142.95462036132812


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.41it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.38it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.33it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.27it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.00408935546875 	 kl mean: 0.05795404314994812 	 loss mean: 143.06204223632812
nll mean: 142.97418212890625 	 kl mean: 0.05795404314994812 	 loss mean: 143.03213500976562
nll mean: 142.88555908203125 	 kl mean: 0.05795404314994812 	 loss mean: 142.94351196289062


                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
 30%|███       | 3/10 [00:00<00:00, 26.96it/s][A
 60%|██████    | 6/10 [00:00<00:00, 26.58it/s][A

nll mean: 68.39159393310547 	 kl mean: 0.04233042150735855 	 loss mean: 68.43392944335938
nll mean: 68.46772766113281 	 kl mean: 0.04233042150735855 	 loss mean: 68.51005554199219
nll mean: 68.40415954589844 	 kl mean: 0.04233042150735855 	 loss mean: 68.44650268554688
nll mean: 68.47545623779297 	 kl mean: 0.04233042150735855 	 loss mean: 68.51778411865234
nll mean: 68.46492767333984 	 kl mean: 0.04233042150735855 	 loss mean: 68.50726318359375
nll mean: 68.41340637207031 	 kl mean: 0.04233042150735855 	 loss mean: 68.45574188232422


                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.58it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 26.32it/s][A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 68.437744140625 	 kl mean: 0.04233042150735855 	 loss mean: 68.48007202148438
nll mean: 68.54057312011719 	 kl mean: 0.04233042150735855 	 loss mean: 68.5829086303711
nll mean: 68.45260620117188 	 kl mean: 0.04233042150735855 	 loss mean: 68.49493408203125
nll mean: 68.47648620605469 	 kl mean: 0.04233042150735855 	 loss mean: 68.51881408691406
nll mean: 123.896484375 	 kl mean: 0.0475754588842392 	 loss mean: 123.94406127929688


                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 22.66it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.76it/s][A

nll mean: 123.94340515136719 	 kl mean: 0.0475754588842392 	 loss mean: 123.9909896850586
nll mean: 123.94403839111328 	 kl mean: 0.0475754588842392 	 loss mean: 123.99160766601562
nll mean: 123.962646484375 	 kl mean: 0.0475754588842392 	 loss mean: 124.01022338867188
nll mean: 123.96127319335938 	 kl mean: 0.0475754588842392 	 loss mean: 124.00885009765625
nll mean: 123.9788589477539 	 kl mean: 0.0475754588842392 	 loss mean: 124.02643585205078


                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.76it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:20<00:03,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 22.47it/s][A
 89%|████████▉ | 34/38 [00:20<00:02,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.92646789550781 	 kl mean: 0.0475754588842392 	 loss mean: 123.97404479980469
nll mean: 124.04795837402344 	 kl mean: 0.0475754588842392 	 loss mean: 124.09552764892578
nll mean: 123.96575164794922 	 kl mean: 0.0475754588842392 	 loss mean: 124.01333618164062
nll mean: 123.95515441894531 	 kl mean: 0.0475754588842392 	 loss mean: 124.00273895263672


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A

nll mean: 124.80899810791016 	 kl mean: 0.03724836930632591 	 loss mean: 124.84625244140625
nll mean: 124.86260986328125 	 kl mean: 0.03724836930632591 	 loss mean: 124.89985656738281
nll mean: 124.78804016113281 	 kl mean: 0.03724836930632591 	 loss mean: 124.82528686523438


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 12.79it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.83it/s][A

nll mean: 124.83880615234375 	 kl mean: 0.03724836930632591 	 loss mean: 124.87605285644531
nll mean: 124.8292236328125 	 kl mean: 0.03724836930632591 	 loss mean: 124.86647033691406
nll mean: 124.89718627929688 	 kl mean: 0.03724836930632591 	 loss mean: 124.93444061279297


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.83it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.88it/s][A

nll mean: 124.92320251464844 	 kl mean: 0.03724836930632591 	 loss mean: 124.96045684814453
nll mean: 124.83650207519531 	 kl mean: 0.03724836930632591 	 loss mean: 124.8737564086914
nll mean: 124.85816192626953 	 kl mean: 0.03724836930632591 	 loss mean: 124.89541625976562


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.88it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.99it/s][A
 92%|█████████▏| 35/38 [00:21<00:01,  1.53it/s]
                                               
 92%|█████████▏| 35/38 [00:21<00:01,  1.53it/s]
                                               
 92%|█████████▏| 35/38 [00:21<00:01,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.95it/s][A

nll mean: 124.85408020019531 	 kl mean: 0.03724836930632591 	 loss mean: 124.8913345336914
nll mean: 118.63619995117188 	 kl mean: 0.053908638656139374 	 loss mean: 118.69010925292969
nll mean: 118.48933410644531 	 kl mean: 0.053908638656139374 	 loss mean: 118.54325103759766


                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 10.95it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 10.93it/s][A

nll mean: 118.500732421875 	 kl mean: 0.053908638656139374 	 loss mean: 118.55464172363281
nll mean: 118.52779388427734 	 kl mean: 0.053908638656139374 	 loss mean: 118.58171081542969
nll mean: 118.5181884765625 	 kl mean: 0.053908638656139374 	 loss mean: 118.57209777832031


                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 10.93it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.89it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.89it/s][A

nll mean: 118.4974365234375 	 kl mean: 0.053908638656139374 	 loss mean: 118.55134582519531
nll mean: 118.46407318115234 	 kl mean: 0.053908638656139374 	 loss mean: 118.51799011230469
nll mean: 118.55549621582031 	 kl mean: 0.053908638656139374 	 loss mean: 118.60940551757812


                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:01,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.85it/s][A
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.43528747558594 	 kl mean: 0.053908638656139374 	 loss mean: 118.48919677734375
nll mean: 118.57879638671875 	 kl mean: 0.053908638656139374 	 loss mean: 118.63270568847656
nll mean: 118.2215805053711 	 kl mean: 0.05541873723268509 	 loss mean: 118.2770004272461
nll mean: 118.20008087158203 	 kl mean: 0.05541873723268509 	 loss mean: 118.2554931640625


                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
                                               [A
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
                                               [A
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
 30%|███       | 3/10 [00:00<00:00, 24.23it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.81it/s][A

nll mean: 118.12406921386719 	 kl mean: 0.05541873723268509 	 loss mean: 118.17948913574219
nll mean: 118.20626831054688 	 kl mean: 0.05541873723268509 	 loss mean: 118.26168060302734
nll mean: 118.22342681884766 	 kl mean: 0.05541873723268509 	 loss mean: 118.27883911132812
nll mean: 118.1196060180664 	 kl mean: 0.05541873723268509 	 loss mean: 118.17503356933594
nll mean: 118.20101928710938 	 kl mean: 0.05541873723268509 	 loss mean: 118.25643157958984


                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.36it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.81it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.36it/s]
100%|██████████| 10/10 [00:00<00:00, 23.34it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.09834289550781 	 kl mean: 0.05541873723268509 	 loss mean: 118.15376281738281
nll mean: 118.17919921875 	 kl mean: 0.05541873723268509 	 loss mean: 118.234619140625
nll mean: 118.190673828125 	 kl mean: 0.05541873723268509 	 loss mean: 118.24609375
nll mean: 90.82568359375 	 kl mean: 0.047700222581624985 	 loss mean: 90.87339782714844
nll mean: 90.833251953125 	 kl mean: 0.047700222581624985 	 loss mean: 90.88096618652344
nll mean: 90.87284851074219 	 kl mean: 0.047700222581624985 	 loss mean: 90.92054748535156


                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 31.53it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 31.36it/s][A
100%|██████████| 38/38 [00:23<00:00,  1.62it/s]


nll mean: 90.90898132324219 	 kl mean: 0.047700222581624985 	 loss mean: 90.9566879272461
nll mean: 90.81423950195312 	 kl mean: 0.047700222581624985 	 loss mean: 90.86195373535156
nll mean: 90.79207611083984 	 kl mean: 0.047700222581624985 	 loss mean: 90.83977508544922
nll mean: 90.80802917480469 	 kl mean: 0.047700222581624985 	 loss mean: 90.85572814941406
nll mean: 90.80914306640625 	 kl mean: 0.047700222581624985 	 loss mean: 90.85685729980469
nll mean: 90.82313537597656 	 kl mean: 0.047700222581624985 	 loss mean: 90.87083435058594
nll mean: 90.91683959960938 	 kl mean: 0.047700222581624985 	 loss mean: 90.96453857421875
Approximate NLL:
tensor(126.9970, device='cuda:0')
Approximate KL:
tensor(0.0486, device='cuda:0')
Testing took 0:00:26.320260


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .34it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .34it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .34it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 26.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 26.05it/s][A

nll mean: 116.2921142578125 	 kl mean: 0.04677597060799599 	 loss mean: 116.33889770507812
nll mean: 116.19692993164062 	 kl mean: 0.04677597060799599 	 loss mean: 116.24370574951172
nll mean: 116.31024169921875 	 kl mean: 0.04677597060799599 	 loss mean: 116.35701751708984
nll mean: 116.31375122070312 	 kl mean: 0.04677597060799599 	 loss mean: 116.36052703857422
nll mean: 116.31220245361328 	 kl mean: 0.04677597060799599 	 loss mean: 116.35897827148438
nll mean: 116.32537841796875 	 kl mean: 0.04677597060799599 	 loss mean: 116.37216186523438


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .05it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .05it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 26.05it/s][A
                                      .66it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.37it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.24285888671875 	 kl mean: 0.04677597060799599 	 loss mean: 116.28962707519531
nll mean: 116.32119750976562 	 kl mean: 0.04677597060799599 	 loss mean: 116.36798095703125
nll mean: 116.44027709960938 	 kl mean: 0.04677597060799599 	 loss mean: 116.48705291748047
nll mean: 116.26786041259766 	 kl mean: 0.04677597060799599 	 loss mean: 116.31463623046875
nll mean: 131.48898315429688 	 kl mean: 0.04498990252614021 	 loss mean: 131.5339813232422


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.11it/s][A
                                              [A

nll mean: 131.51275634765625 	 kl mean: 0.04498990252614021 	 loss mean: 131.55775451660156
nll mean: 131.44515991210938 	 kl mean: 0.04498990252614021 	 loss mean: 131.49014282226562
nll mean: 131.35116577148438 	 kl mean: 0.04498990252614021 	 loss mean: 131.39614868164062



  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
                                              [A


nll mean: 131.44493103027344 	 kl mean: 0.04498990252614021 	 loss mean: 131.4899139404297
nll mean: 131.49005126953125 	 kl mean: 0.04498990252614021 	 loss mean: 131.5350341796875
nll mean: 131.44427490234375 	 kl mean: 0.04498990252614021 	 loss mean: 131.4892578125


  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.60it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.52it/s]
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.52it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.84it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 131.45579528808594 	 kl mean: 0.04498990252614021 	 loss mean: 131.50079345703125
nll mean: 131.4111328125 	 kl mean: 0.04498990252614021 	 loss mean: 131.45611572265625
nll mean: 131.5458221435547 	 kl mean: 0.04498990252614021 	 loss mean: 131.5908203125
nll mean: 105.23745727539062 	 kl mean: 0.051116373389959335 	 loss mean: 105.28857421875


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
 30%|███       | 3/10 [00:00<00:00, 25.93it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.79it/s][A

nll mean: 105.21452331542969 	 kl mean: 0.051116373389959335 	 loss mean: 105.26563262939453
nll mean: 105.14714050292969 	 kl mean: 0.051116373389959335 	 loss mean: 105.19825744628906
nll mean: 105.18849182128906 	 kl mean: 0.051116373389959335 	 loss mean: 105.2396011352539
nll mean: 105.29627227783203 	 kl mean: 0.051116373389959335 	 loss mean: 105.3473892211914
nll mean: 105.20787811279297 	 kl mean: 0.051116373389959335 	 loss mean: 105.25898742675781
nll mean: 105.24127960205078 	 kl mean: 0.051116373389959335 	 loss mean: 105.29239654541016


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.79it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.08it/s]
100%|██████████| 10/10 [00:00<00:00, 25.64it/s][A
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s]

nll mean: 105.32832336425781 	 kl mean: 0.051116373389959335 	 loss mean: 105.37944030761719
nll mean: 105.28395080566406 	 kl mean: 0.051116373389959335 	 loss mean: 105.33506774902344
nll mean: 105.29460144042969 	 kl mean: 0.051116373389959335 	 loss mean: 105.34571838378906
nll mean: 144.74246215820312 	 kl mean: 0.05574717000126839 	 loss mean: 144.79818725585938



                                              
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s]
 20%|██        | 2/10 [00:00<00:00, 11.09it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s][A
 40%|████      | 4/10 [00:00<00:00, 11.12it/s][A

nll mean: 144.72421264648438 	 kl mean: 0.05574717000126839 	 loss mean: 144.77996826171875
nll mean: 144.713623046875 	 kl mean: 0.05574717000126839 	 loss mean: 144.76937866210938
nll mean: 144.6132354736328 	 kl mean: 0.05574717000126839 	 loss mean: 144.66897583007812



                                              
  8%|▊         | 3/38 [00:01<00:15,  2.20it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:15,  2.20it/s][A
 60%|██████    | 6/10 [00:00<00:00, 11.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:15,  2.20it/s][A

nll mean: 144.77008056640625 	 kl mean: 0.05574717000126839 	 loss mean: 144.8258056640625
nll mean: 144.84188842773438 	 kl mean: 0.05574717000126839 	 loss mean: 144.8976287841797
nll mean: 144.73446655273438 	 kl mean: 0.05574717000126839 	 loss mean: 144.79022216796875



                                              
  8%|▊         | 3/38 [00:02<00:15,  2.20it/s][A
 80%|████████  | 8/10 [00:00<00:00, 11.10it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:15,  2.20it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:15,  2.20it/s][A
100%|██████████| 10/10 [00:00<00:00, 11.10it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.743896484375 	 kl mean: 0.05574717000126839 	 loss mean: 144.7996368408203
nll mean: 144.67355346679688 	 kl mean: 0.05574717000126839 	 loss mean: 144.7292938232422
nll mean: 144.751708984375 	 kl mean: 0.05574717000126839 	 loss mean: 144.80746459960938



                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 14.51it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A

nll mean: 131.43138122558594 	 kl mean: 0.04855237901210785 	 loss mean: 131.4799346923828
nll mean: 131.53236389160156 	 kl mean: 0.04855237901210785 	 loss mean: 131.58091735839844
nll mean: 131.46951293945312 	 kl mean: 0.04855237901210785 	 loss mean: 131.51806640625



                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.39it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.42it/s][A

nll mean: 131.40782165527344 	 kl mean: 0.04855237901210785 	 loss mean: 131.45639038085938
nll mean: 131.41818237304688 	 kl mean: 0.04855237901210785 	 loss mean: 131.46673583984375
nll mean: 131.48880004882812 	 kl mean: 0.04855237901210785 	 loss mean: 131.537353515625



                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.39it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.70it/s][A

nll mean: 131.48883056640625 	 kl mean: 0.04855237901210785 	 loss mean: 131.53738403320312
nll mean: 131.40966796875 	 kl mean: 0.04855237901210785 	 loss mean: 131.4582061767578
nll mean: 131.40594482421875 	 kl mean: 0.04855237901210785 	 loss mean: 131.45449829101562



                                              
 11%|█         | 4/38 [00:03<00:20,  1.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.37it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 15.41it/s][A

nll mean: 131.41497802734375 	 kl mean: 0.04855237901210785 	 loss mean: 131.46353149414062
nll mean: 129.46124267578125 	 kl mean: 0.04237170144915581 	 loss mean: 129.50360107421875
nll mean: 129.533203125 	 kl mean: 0.04237170144915581 	 loss mean: 129.57557678222656


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 15.41it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 15.08it/s][A

nll mean: 129.4718017578125 	 kl mean: 0.04237170144915581 	 loss mean: 129.51417541503906
nll mean: 129.39891052246094 	 kl mean: 0.04237170144915581 	 loss mean: 129.4412841796875
nll mean: 129.55711364746094 	 kl mean: 0.04237170144915581 	 loss mean: 129.5994873046875


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 15.08it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.81it/s][A
                                              [A


nll mean: 129.47467041015625 	 kl mean: 0.04237170144915581 	 loss mean: 129.5170440673828
nll mean: 129.53213500976562 	 kl mean: 0.04237170144915581 	 loss mean: 129.5745086669922
nll mean: 129.5431365966797 	 kl mean: 0.04237170144915581 	 loss mean: 129.58551025390625


 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.81it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.89it/s][A
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s]
 30%|███       | 3/10 [00:00<00:00, 25.90it/s][A

nll mean: 129.39462280273438 	 kl mean: 0.04237170144915581 	 loss mean: 129.43698120117188
nll mean: 129.558349609375 	 kl mean: 0.04237170144915581 	 loss mean: 129.6007080078125
nll mean: 138.9402618408203 	 kl mean: 0.03907628357410431 	 loss mean: 138.97933959960938
nll mean: 138.9283447265625 	 kl mean: 0.03907628357410431 	 loss mean: 138.96742248535156
nll mean: 138.95236206054688 	 kl mean: 0.03907628357410431 	 loss mean: 138.99142456054688



                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.58it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.57it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.57it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.57it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.53it/s][A

nll mean: 138.96925354003906 	 kl mean: 0.03907628357410431 	 loss mean: 139.00833129882812
nll mean: 138.97315979003906 	 kl mean: 0.03907628357410431 	 loss mean: 139.01223754882812
nll mean: 139.03057861328125 	 kl mean: 0.03907628357410431 	 loss mean: 139.06964111328125
nll mean: 138.9681396484375 	 kl mean: 0.03907628357410431 	 loss mean: 139.0072021484375
nll mean: 139.044189453125 	 kl mean: 0.03907628357410431 	 loss mean: 139.083251953125
nll mean: 139.04696655273438 	 kl mean: 0.03907628357410431 	 loss mean: 139.08604431152344



                                              
100%|██████████| 10/10 [00:00<00:00, 25.36it/s][A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 25.52it/s][A

nll mean: 138.97366333007812 	 kl mean: 0.03907628357410431 	 loss mean: 139.01275634765625
nll mean: 112.22024536132812 	 kl mean: 0.048479922115802765 	 loss mean: 112.26873016357422
nll mean: 112.24431610107422 	 kl mean: 0.048479922115802765 	 loss mean: 112.29280090332031
nll mean: 112.21377563476562 	 kl mean: 0.048479922115802765 	 loss mean: 112.26225280761719
nll mean: 112.16818237304688 	 kl mean: 0.048479922115802765 	 loss mean: 112.21666717529297
nll mean: 112.23698425292969 	 kl mean: 0.048479922115802765 	 loss mean: 112.28546142578125


                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 25.52it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.51it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.77it/s]
100%|██████████| 10/10 [00:00<00:00, 25.51it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.95it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.29957580566406 	 kl mean: 0.048479922115802765 	 loss mean: 112.34805297851562
nll mean: 112.17391967773438 	 kl mean: 0.048479922115802765 	 loss mean: 112.22239685058594
nll mean: 112.17137145996094 	 kl mean: 0.048479922115802765 	 loss mean: 112.21985626220703
nll mean: 112.3065414428711 	 kl mean: 0.048479922115802765 	 loss mean: 112.35501098632812
nll mean: 112.22592163085938 	 kl mean: 0.048479922115802765 	 loss mean: 112.27439880371094



                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s]
 20%|██        | 2/10 [00:00<00:00, 15.45it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.51it/s][A

nll mean: 137.9402618408203 	 kl mean: 0.04216358810663223 	 loss mean: 137.982421875
nll mean: 138.01873779296875 	 kl mean: 0.04216358810663223 	 loss mean: 138.06089782714844
nll mean: 137.93267822265625 	 kl mean: 0.04216358810663223 	 loss mean: 137.97483825683594
nll mean: 137.9566650390625 	 kl mean: 0.04216358810663223 	 loss mean: 137.9988250732422



                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.67it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.95it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.95it/s][A
 80%|████████  | 8/10 [00:00<00:00, 15.82it/s][A

nll mean: 137.94268798828125 	 kl mean: 0.04216358810663223 	 loss mean: 137.98486328125
nll mean: 137.9305419921875 	 kl mean: 0.04216358810663223 	 loss mean: 137.9727020263672
nll mean: 137.91238403320312 	 kl mean: 0.04216358810663223 	 loss mean: 137.95455932617188
nll mean: 137.93704223632812 	 kl mean: 0.04216358810663223 	 loss mean: 137.97921752929688



                                              
 21%|██        | 8/38 [00:05<00:15,  1.95it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.95it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.59it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s]

nll mean: 137.95556640625 	 kl mean: 0.04216358810663223 	 loss mean: 137.99771118164062
nll mean: 137.9733123779297 	 kl mean: 0.04216358810663223 	 loss mean: 138.01547241210938
nll mean: 136.77357482910156 	 kl mean: 0.04301464557647705 	 loss mean: 136.81658935546875
nll mean: 136.8630828857422 	 kl mean: 0.04301464557647705 	 loss mean: 136.90609741210938



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s]
 30%|███       | 3/10 [00:00<00:00, 22.53it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.49it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A

nll mean: 136.74566650390625 	 kl mean: 0.04301464557647705 	 loss mean: 136.7886962890625
nll mean: 136.80917358398438 	 kl mean: 0.04301464557647705 	 loss mean: 136.85220336914062
nll mean: 136.84051513671875 	 kl mean: 0.04301464557647705 	 loss mean: 136.88352966308594
nll mean: 136.83871459960938 	 kl mean: 0.04301464557647705 	 loss mean: 136.8817138671875
nll mean: 136.78160095214844 	 kl mean: 0.04301464557647705 	 loss mean: 136.82460021972656



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.81it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.43it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 22.25it/s][A
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s]

nll mean: 136.78443908691406 	 kl mean: 0.04301464557647705 	 loss mean: 136.82745361328125
nll mean: 136.7828369140625 	 kl mean: 0.04301464557647705 	 loss mean: 136.8258514404297
nll mean: 136.80369567871094 	 kl mean: 0.04301464557647705 	 loss mean: 136.84671020507812
nll mean: 123.67607116699219 	 kl mean: 0.039846353232860565 	 loss mean: 123.71591186523438
nll mean: 123.68087005615234 	 kl mean: 0.039846353232860565 	 loss mean: 123.72071838378906



                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s]
 30%|███       | 3/10 [00:00<00:00, 25.27it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.33it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A

nll mean: 123.73348999023438 	 kl mean: 0.039846353232860565 	 loss mean: 123.77333068847656
nll mean: 123.58706665039062 	 kl mean: 0.039846353232860565 	 loss mean: 123.62691497802734
nll mean: 123.65126037597656 	 kl mean: 0.039846353232860565 	 loss mean: 123.69110107421875
nll mean: 123.63200378417969 	 kl mean: 0.039846353232860565 	 loss mean: 123.67184448242188
nll mean: 123.68761444091797 	 kl mean: 0.039846353232860565 	 loss mean: 123.72746276855469
nll mean: 123.7626953125 	 kl mean: 0.039846353232860565 	 loss mean: 123.80254364013672



                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.91it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.34it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.32it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s]
 30%|███       | 3/10 [00:00<00:00, 22.14it/s][A

nll mean: 123.7201156616211 	 kl mean: 0.039846353232860565 	 loss mean: 123.75996398925781
nll mean: 123.7448959350586 	 kl mean: 0.039846353232860565 	 loss mean: 123.78473663330078
nll mean: 147.22531127929688 	 kl mean: 0.047599487006664276 	 loss mean: 147.27291870117188
nll mean: 147.14979553222656 	 kl mean: 0.047599487006664276 	 loss mean: 147.1973876953125
nll mean: 147.14337158203125 	 kl mean: 0.047599487006664276 	 loss mean: 147.19097900390625



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.04it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A

nll mean: 147.1212158203125 	 kl mean: 0.047599487006664276 	 loss mean: 147.16880798339844
nll mean: 147.19361877441406 	 kl mean: 0.047599487006664276 	 loss mean: 147.2412109375
nll mean: 147.18551635742188 	 kl mean: 0.047599487006664276 	 loss mean: 147.23312377929688
nll mean: 147.15936279296875 	 kl mean: 0.047599487006664276 	 loss mean: 147.20697021484375
nll mean: 147.2075958251953 	 kl mean: 0.047599487006664276 	 loss mean: 147.2552032470703



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.06it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.22it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.12it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s]

nll mean: 147.1593017578125 	 kl mean: 0.047599487006664276 	 loss mean: 147.2069091796875
nll mean: 147.1337890625 	 kl mean: 0.047599487006664276 	 loss mean: 147.181396484375
nll mean: 125.43991088867188 	 kl mean: 0.04081382229924202 	 loss mean: 125.48072814941406



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s]
 20%|██        | 2/10 [00:00<00:00, 12.89it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.94it/s][A

nll mean: 125.49612426757812 	 kl mean: 0.04081382229924202 	 loss mean: 125.53692626953125
nll mean: 125.49314880371094 	 kl mean: 0.04081382229924202 	 loss mean: 125.53396606445312
nll mean: 125.42286682128906 	 kl mean: 0.04081382229924202 	 loss mean: 125.46368408203125



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.10it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.10it/s][A

nll mean: 125.54792785644531 	 kl mean: 0.04081382229924202 	 loss mean: 125.58872985839844
nll mean: 125.52323913574219 	 kl mean: 0.04081382229924202 	 loss mean: 125.5640640258789
nll mean: 125.40926361083984 	 kl mean: 0.04081382229924202 	 loss mean: 125.45008087158203



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.10it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.99it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.10it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.10it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.02it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.41677856445312 	 kl mean: 0.04081382229924202 	 loss mean: 125.45758056640625
nll mean: 125.46803283691406 	 kl mean: 0.04081382229924202 	 loss mean: 125.50885009765625
nll mean: 125.4141616821289 	 kl mean: 0.04081382229924202 	 loss mean: 125.4549789428711


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
[A                                           

nll mean: 168.47825622558594 	 kl mean: 0.050489865243434906 	 loss mean: 168.52874755859375
nll mean: 168.46881103515625 	 kl mean: 0.050489865243434906 	 loss mean: 168.51930236816406


 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
 20%|██        | 2/10 [00:00<00:00, 10.23it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 10.15it/s][A


nll mean: 168.52537536621094 	 kl mean: 0.050489865243434906 	 loss mean: 168.5758514404297
nll mean: 168.5375518798828 	 kl mean: 0.050489865243434906 	 loss mean: 168.58804321289062
nll mean: 168.595947265625 	 kl mean: 0.050489865243434906 	 loss mean: 168.6464385986328


                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.77it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.13it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.77it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.19it/s][A

nll mean: 168.54107666015625 	 kl mean: 0.050489865243434906 	 loss mean: 168.591552734375
nll mean: 168.51358032226562 	 kl mean: 0.050489865243434906 	 loss mean: 168.56405639648438
nll mean: 168.57801818847656 	 kl mean: 0.050489865243434906 	 loss mean: 168.62850952148438


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.77it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.19it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.77it/s]
100%|██████████| 10/10 [00:00<00:00, 10.18it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s]

nll mean: 168.44451904296875 	 kl mean: 0.050489865243434906 	 loss mean: 168.49501037597656
nll mean: 168.48135375976562 	 kl mean: 0.050489865243434906 	 loss mean: 168.53182983398438
nll mean: 140.58572387695312 	 kl mean: 0.046792253851890564 	 loss mean: 140.63250732421875



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 18.54it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.43it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A

nll mean: 140.78692626953125 	 kl mean: 0.046792253851890564 	 loss mean: 140.83370971679688
nll mean: 140.68963623046875 	 kl mean: 0.046792253851890564 	 loss mean: 140.73641967773438
nll mean: 140.58888244628906 	 kl mean: 0.046792253851890564 	 loss mean: 140.63568115234375
nll mean: 140.6046142578125 	 kl mean: 0.046792253851890564 	 loss mean: 140.65139770507812



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.43it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A

nll mean: 140.6473846435547 	 kl mean: 0.046792253851890564 	 loss mean: 140.69418334960938
nll mean: 140.66944885253906 	 kl mean: 0.046792253851890564 	 loss mean: 140.71624755859375
nll mean: 140.5372314453125 	 kl mean: 0.046792253851890564 	 loss mean: 140.58401489257812
nll mean: 140.60523986816406 	 kl mean: 0.046792253851890564 	 loss mean: 140.65203857421875



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.39it/s][A
 39%|███▉      | 15/38 [00:08<00:14,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 39%|███▉      | 15/38 [00:08<00:14,  1.55it/s]
                                               
 39%|███▉      | 15/38 [00:08<00:14,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 11.04it/s][A

nll mean: 140.61961364746094 	 kl mean: 0.046792253851890564 	 loss mean: 140.66639709472656
nll mean: 150.04515075683594 	 kl mean: 0.043636731803417206 	 loss mean: 150.0887908935547
nll mean: 149.98974609375 	 kl mean: 0.043636731803417206 	 loss mean: 150.03338623046875



                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 11.06it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A

nll mean: 150.10800170898438 	 kl mean: 0.043636731803417206 	 loss mean: 150.15162658691406
nll mean: 149.98312377929688 	 kl mean: 0.043636731803417206 	 loss mean: 150.02676391601562
nll mean: 150.10556030273438 	 kl mean: 0.043636731803417206 	 loss mean: 150.14918518066406



                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 11.04it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 11.04it/s][A

nll mean: 150.04736328125 	 kl mean: 0.043636731803417206 	 loss mean: 150.09100341796875
nll mean: 150.0498046875 	 kl mean: 0.043636731803417206 	 loss mean: 150.09344482421875
nll mean: 149.99237060546875 	 kl mean: 0.043636731803417206 	 loss mean: 150.03602600097656



                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:14,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 11.00it/s][A
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s]

nll mean: 150.07943725585938 	 kl mean: 0.043636731803417206 	 loss mean: 150.1230926513672
nll mean: 149.9764862060547 	 kl mean: 0.043636731803417206 	 loss mean: 150.02011108398438
nll mean: 150.6346435546875 	 kl mean: 0.0529838502407074 	 loss mean: 150.68763732910156
nll mean: 150.6168975830078 	 kl mean: 0.0529838502407074 	 loss mean: 150.6698760986328



                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s]
 30%|███       | 3/10 [00:00<00:00, 25.17it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.22it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:15,  1.38it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:15,  1.38it/s][A

nll mean: 150.65386962890625 	 kl mean: 0.0529838502407074 	 loss mean: 150.7068634033203
nll mean: 150.6378173828125 	 kl mean: 0.0529838502407074 	 loss mean: 150.6907958984375
nll mean: 150.62100219726562 	 kl mean: 0.0529838502407074 	 loss mean: 150.67398071289062
nll mean: 150.59298706054688 	 kl mean: 0.0529838502407074 	 loss mean: 150.64596557617188
nll mean: 150.6192626953125 	 kl mean: 0.0529838502407074 	 loss mean: 150.6722412109375
nll mean: 150.64234924316406 	 kl mean: 0.0529838502407074 	 loss mean: 150.69534301757812



                                               
 42%|████▏     | 16/38 [00:10<00:15,  1.38it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.97it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.97it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 25.63it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 25.63it/s]

nll mean: 150.64935302734375 	 kl mean: 0.0529838502407074 	 loss mean: 150.70233154296875
nll mean: 150.68287658691406 	 kl mean: 0.0529838502407074 	 loss mean: 150.73583984375
nll mean: 139.4163818359375 	 kl mean: 0.0411556214094162 	 loss mean: 139.45751953125
nll mean: 139.40328979492188 	 kl mean: 0.0411556214094162 	 loss mean: 139.44444274902344
nll mean: 139.48609924316406 	 kl mean: 0.0411556214094162 	 loss mean: 139.52725219726562
nll mean: 139.44833374023438 	 kl mean: 0.0411556214094162 	 loss mean: 139.48948669433594


 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.50it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.31it/s][A
                                               


nll mean: 139.45526123046875 	 kl mean: 0.0411556214094162 	 loss mean: 139.49639892578125
nll mean: 139.37411499023438 	 kl mean: 0.0411556214094162 	 loss mean: 139.41525268554688
nll mean: 139.5150146484375 	 kl mean: 0.0411556214094162 	 loss mean: 139.55615234375
nll mean: 139.4080352783203 	 kl mean: 0.0411556214094162 	 loss mean: 139.44918823242188
nll mean: 139.4109649658203 	 kl mean: 0.0411556214094162 	 loss mean: 139.45211791992188
nll mean: 139.43850708007812 	 kl mean: 0.0411556214094162 	 loss mean: 139.47967529296875


100%|██████████| 10/10 [00:00<00:00, 25.16it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s]
 20%|██        | 2/10 [00:00<00:00, 12.93it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s][A

nll mean: 137.32176208496094 	 kl mean: 0.04436784237623215 	 loss mean: 137.3661346435547
nll mean: 137.2832794189453 	 kl mean: 0.04436784237623215 	 loss mean: 137.32765197753906
nll mean: 137.33010864257812 	 kl mean: 0.04436784237623215 	 loss mean: 137.37448120117188



                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.92it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.78it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.96it/s][A

nll mean: 137.27792358398438 	 kl mean: 0.04436784237623215 	 loss mean: 137.3223114013672
nll mean: 137.27099609375 	 kl mean: 0.04436784237623215 	 loss mean: 137.31536865234375
nll mean: 137.283935546875 	 kl mean: 0.04436784237623215 	 loss mean: 137.3282928466797



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.78it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.78it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.02it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.78it/s][A

nll mean: 137.3235321044922 	 kl mean: 0.04436784237623215 	 loss mean: 137.36788940429688
nll mean: 137.27301025390625 	 kl mean: 0.04436784237623215 	 loss mean: 137.3173828125
nll mean: 137.29666137695312 	 kl mean: 0.04436784237623215 	 loss mean: 137.34103393554688



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.78it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.96it/s][A
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 13.26it/s][A

nll mean: 137.33946228027344 	 kl mean: 0.04436784237623215 	 loss mean: 137.3838348388672
nll mean: 152.17001342773438 	 kl mean: 0.0416901595890522 	 loss mean: 152.21170043945312
nll mean: 152.26197814941406 	 kl mean: 0.0416901595890522 	 loss mean: 152.30368041992188



                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.19it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A

nll mean: 152.23760986328125 	 kl mean: 0.0416901595890522 	 loss mean: 152.279296875
nll mean: 152.22312927246094 	 kl mean: 0.0416901595890522 	 loss mean: 152.26483154296875
nll mean: 152.13217163085938 	 kl mean: 0.0416901595890522 	 loss mean: 152.1738739013672



                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.18it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.07it/s][A

nll mean: 152.19688415527344 	 kl mean: 0.0416901595890522 	 loss mean: 152.2385711669922
nll mean: 152.11105346679688 	 kl mean: 0.0416901595890522 	 loss mean: 152.15274047851562
nll mean: 152.1277618408203 	 kl mean: 0.0416901595890522 	 loss mean: 152.16946411132812



                                               
 50%|█████     | 19/38 [00:11<00:11,  1.60it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:11,  1.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.01it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s]

nll mean: 152.24598693847656 	 kl mean: 0.0416901595890522 	 loss mean: 152.28768920898438
nll mean: 152.109130859375 	 kl mean: 0.0416901595890522 	 loss mean: 152.1508331298828
nll mean: 161.4036865234375 	 kl mean: 0.04471147805452347 	 loss mean: 161.44839477539062



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.20it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.17it/s][A

nll mean: 161.4883270263672 	 kl mean: 0.04471147805452347 	 loss mean: 161.5330352783203
nll mean: 161.41372680664062 	 kl mean: 0.04471147805452347 	 loss mean: 161.45843505859375
nll mean: 161.47467041015625 	 kl mean: 0.04471147805452347 	 loss mean: 161.5193634033203



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.02it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A

nll mean: 161.41493225097656 	 kl mean: 0.04471147805452347 	 loss mean: 161.4596405029297
nll mean: 161.4481658935547 	 kl mean: 0.04471147805452347 	 loss mean: 161.49285888671875
nll mean: 161.36834716796875 	 kl mean: 0.04471147805452347 	 loss mean: 161.41305541992188



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.78it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.50it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.85it/s][A
 55%|█████▌    | 21/38 [00:12<00:11,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 161.41180419921875 	 kl mean: 0.04471147805452347 	 loss mean: 161.45651245117188
nll mean: 161.39707946777344 	 kl mean: 0.04471147805452347 	 loss mean: 161.4417724609375
nll mean: 161.4417724609375 	 kl mean: 0.04471147805452347 	 loss mean: 161.48648071289062


                                               
 55%|█████▌    | 21/38 [00:12<00:11,  1.42it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 20%|██        | 2/10 [00:00<00:00, 10.45it/s][A

nll mean: 122.5652084350586 	 kl mean: 0.0480264276266098 	 loss mean: 122.61323547363281
nll mean: 122.52471160888672 	 kl mean: 0.0480264276266098 	 loss mean: 122.57273864746094
nll mean: 122.51463317871094 	 kl mean: 0.0480264276266098 	 loss mean: 122.56265258789062


                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 20%|██        | 2/10 [00:00<00:00, 10.45it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 40%|████      | 4/10 [00:00<00:00, 10.47it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.49it/s][A

nll mean: 122.47826385498047 	 kl mean: 0.0480264276266098 	 loss mean: 122.52629089355469
nll mean: 122.48751068115234 	 kl mean: 0.0480264276266098 	 loss mean: 122.53553009033203
nll mean: 122.55816650390625 	 kl mean: 0.0480264276266098 	 loss mean: 122.60619354248047


                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.49it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.41it/s][A

nll mean: 122.567138671875 	 kl mean: 0.0480264276266098 	 loss mean: 122.61517333984375
nll mean: 122.54983520507812 	 kl mean: 0.0480264276266098 	 loss mean: 122.59786224365234
nll mean: 122.62936401367188 	 kl mean: 0.0480264276266098 	 loss mean: 122.6773910522461


                                               
 55%|█████▌    | 21/38 [00:13<00:11,  1.42it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.41it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.39it/s][A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
 40%|████      | 4/10 [00:00<00:00, 34.37it/s][A

nll mean: 122.50606536865234 	 kl mean: 0.0480264276266098 	 loss mean: 122.55409240722656
nll mean: 112.21046447753906 	 kl mean: 0.036267951130867004 	 loss mean: 112.24673461914062
nll mean: 112.23857879638672 	 kl mean: 0.036267951130867004 	 loss mean: 112.27485656738281
nll mean: 112.22537231445312 	 kl mean: 0.036267951130867004 	 loss mean: 112.26164245605469
nll mean: 112.26828002929688 	 kl mean: 0.036267951130867004 	 loss mean: 112.30455017089844
nll mean: 112.28787994384766 	 kl mean: 0.036267951130867004 	 loss mean: 112.32414245605469
nll mean: 112.15301513671875 	 kl mean: 0.036267951130867004 	 loss mean: 112.18928527832031


                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.28it/s]
 40%|████      | 4/10 [00:00<00:00, 34.37it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.28it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.28it/s]
100%|██████████| 10/10 [00:00<00:00, 33.67it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]

nll mean: 112.26629638671875 	 kl mean: 0.036267951130867004 	 loss mean: 112.30256652832031
nll mean: 112.24635314941406 	 kl mean: 0.036267951130867004 	 loss mean: 112.28262329101562
nll mean: 112.17364501953125 	 kl mean: 0.036267951130867004 	 loss mean: 112.20991516113281
nll mean: 112.17366790771484 	 kl mean: 0.036267951130867004 	 loss mean: 112.20993041992188
nll mean: 163.03013610839844 	 kl mean: 0.044532760977745056 	 loss mean: 163.07467651367188



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.94it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.92it/s][A
[A                                           

nll mean: 163.00758361816406 	 kl mean: 0.044532760977745056 	 loss mean: 163.0521240234375
nll mean: 163.03680419921875 	 kl mean: 0.044532760977745056 	 loss mean: 163.08132934570312
nll mean: 162.94000244140625 	 kl mean: 0.044532760977745056 	 loss mean: 162.98452758789062


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.91it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A

nll mean: 163.05125427246094 	 kl mean: 0.044532760977745056 	 loss mean: 163.09579467773438
nll mean: 162.9761962890625 	 kl mean: 0.044532760977745056 	 loss mean: 163.02072143554688
nll mean: 163.1066436767578 	 kl mean: 0.044532760977745056 	 loss mean: 163.15118408203125



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.87it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.88it/s][A
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s]

nll mean: 162.93832397460938 	 kl mean: 0.044532760977745056 	 loss mean: 162.98284912109375
nll mean: 163.00238037109375 	 kl mean: 0.044532760977745056 	 loss mean: 163.04690551757812
nll mean: 163.05340576171875 	 kl mean: 0.044532760977745056 	 loss mean: 163.0979461669922
nll mean: 127.43235778808594 	 kl mean: 0.043581925332546234 	 loss mean: 127.47593688964844



                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s]
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 22.91it/s][A
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.73it/s][A

nll mean: 127.51980590820312 	 kl mean: 0.043581925332546234 	 loss mean: 127.56339263916016
nll mean: 127.49261474609375 	 kl mean: 0.043581925332546234 	 loss mean: 127.53619384765625
nll mean: 127.51732635498047 	 kl mean: 0.043581925332546234 	 loss mean: 127.5609130859375
nll mean: 127.49657440185547 	 kl mean: 0.043581925332546234 	 loss mean: 127.54015350341797
nll mean: 127.52625274658203 	 kl mean: 0.043581925332546234 	 loss mean: 127.56983184814453



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.46it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.31it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.44612121582031 	 kl mean: 0.043581925332546234 	 loss mean: 127.48970794677734
nll mean: 127.45735168457031 	 kl mean: 0.043581925332546234 	 loss mean: 127.50092315673828
nll mean: 127.58082580566406 	 kl mean: 0.043581925332546234 	 loss mean: 127.62440490722656
nll mean: 127.5435562133789 	 kl mean: 0.043581925332546234 	 loss mean: 127.5871353149414



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 14.29it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A

nll mean: 120.20415496826172 	 kl mean: 0.03838637098670006 	 loss mean: 120.24253845214844
nll mean: 120.20838165283203 	 kl mean: 0.03838637098670006 	 loss mean: 120.24676513671875
nll mean: 120.24687194824219 	 kl mean: 0.03838637098670006 	 loss mean: 120.28526306152344



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.42it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.51it/s][A

nll mean: 120.27051544189453 	 kl mean: 0.03838637098670006 	 loss mean: 120.30890655517578
nll mean: 120.15534210205078 	 kl mean: 0.03838637098670006 	 loss mean: 120.1937255859375
nll mean: 120.33621215820312 	 kl mean: 0.03838637098670006 	 loss mean: 120.37459564208984



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.54it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A

nll mean: 120.21854400634766 	 kl mean: 0.03838637098670006 	 loss mean: 120.25692749023438
nll mean: 120.24317932128906 	 kl mean: 0.03838637098670006 	 loss mean: 120.28157043457031
nll mean: 120.14275360107422 	 kl mean: 0.03838637098670006 	 loss mean: 120.18113708496094



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.56it/s][A
 68%|██████▊   | 26/38 [00:15<00:07,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.62it/s]
                                               
 68%|██████▊   | 26/38 [00:15<00:07,  1.62it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s]
 30%|███       | 3/10 [00:00<00:00, 22.57it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A

nll mean: 120.18431091308594 	 kl mean: 0.03838637098670006 	 loss mean: 120.22270202636719
nll mean: 87.52556610107422 	 kl mean: 0.06931839883327484 	 loss mean: 87.59487915039062
nll mean: 87.53463745117188 	 kl mean: 0.06931839883327484 	 loss mean: 87.60395812988281
nll mean: 87.450927734375 	 kl mean: 0.06931839883327484 	 loss mean: 87.52024841308594
nll mean: 87.46179962158203 	 kl mean: 0.06931839883327484 	 loss mean: 87.53111267089844



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.90it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.50it/s][A

nll mean: 87.5660171508789 	 kl mean: 0.06931839883327484 	 loss mean: 87.63533020019531
nll mean: 87.54427337646484 	 kl mean: 0.06931839883327484 	 loss mean: 87.61359405517578
nll mean: 87.57933807373047 	 kl mean: 0.06931839883327484 	 loss mean: 87.6486587524414
nll mean: 87.51748657226562 	 kl mean: 0.06931839883327484 	 loss mean: 87.58680725097656
nll mean: 87.49516296386719 	 kl mean: 0.06931839883327484 	 loss mean: 87.56448364257812



                                               
100%|██████████| 10/10 [00:00<00:00, 22.69it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 21.85it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A

nll mean: 87.4969253540039 	 kl mean: 0.06931839883327484 	 loss mean: 87.56623840332031
nll mean: 114.80851745605469 	 kl mean: 0.04222520440816879 	 loss mean: 114.85073852539062
nll mean: 114.77399444580078 	 kl mean: 0.04222520440816879 	 loss mean: 114.81622314453125
nll mean: 114.78470611572266 	 kl mean: 0.04222520440816879 	 loss mean: 114.82693481445312
nll mean: 114.83029174804688 	 kl mean: 0.04222520440816879 	 loss mean: 114.87251281738281



                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.86it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.75it/s][A

nll mean: 114.77430725097656 	 kl mean: 0.04222520440816879 	 loss mean: 114.81654357910156
nll mean: 114.73698425292969 	 kl mean: 0.04222520440816879 	 loss mean: 114.77920532226562
nll mean: 114.85649871826172 	 kl mean: 0.04222520440816879 	 loss mean: 114.89871215820312
nll mean: 114.80372619628906 	 kl mean: 0.04222520440816879 	 loss mean: 114.845947265625
nll mean: 114.79510498046875 	 kl mean: 0.04222520440816879 	 loss mean: 114.83732604980469



                                               
100%|██████████| 10/10 [00:00<00:00, 21.69it/s][A
 74%|███████▎  | 28/38 [00:16<00:05,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:16<00:05,  1.87it/s]
                                               
 74%|███████▎  | 28/38 [00:16<00:05,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A

nll mean: 114.7723159790039 	 kl mean: 0.04222520440816879 	 loss mean: 114.81454467773438
nll mean: 127.48888397216797 	 kl mean: 0.039602190256118774 	 loss mean: 127.52848815917969
nll mean: 127.40680694580078 	 kl mean: 0.039602190256118774 	 loss mean: 127.44640350341797



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.64it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A

nll mean: 127.42850494384766 	 kl mean: 0.039602190256118774 	 loss mean: 127.46810913085938
nll mean: 127.4067153930664 	 kl mean: 0.039602190256118774 	 loss mean: 127.4463119506836
nll mean: 127.3729248046875 	 kl mean: 0.039602190256118774 	 loss mean: 127.41252899169922



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.67it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 127.41571044921875 	 kl mean: 0.039602190256118774 	 loss mean: 127.455322265625
nll mean: 127.42826843261719 	 kl mean: 0.039602190256118774 	 loss mean: 127.46786499023438
nll mean: 127.50692749023438 	 kl mean: 0.039602190256118774 	 loss mean: 127.54652404785156



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.54it/s][A
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s]

nll mean: 127.46327209472656 	 kl mean: 0.039602190256118774 	 loss mean: 127.50286102294922
nll mean: 127.3900146484375 	 kl mean: 0.039602190256118774 	 loss mean: 127.42961883544922
nll mean: 66.43656921386719 	 kl mean: 0.036557793617248535 	 loss mean: 66.4731216430664



                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 10.13it/s][A
                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.02it/s][A

nll mean: 66.49186706542969 	 kl mean: 0.036557793617248535 	 loss mean: 66.5284194946289
nll mean: 66.48604583740234 	 kl mean: 0.036557793617248535 	 loss mean: 66.52259826660156



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.92it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.98it/s]

nll mean: 66.38858032226562 	 kl mean: 0.036557793617248535 	 loss mean: 66.42513275146484
nll mean: 66.42710876464844 	 kl mean: 0.036557793617248535 	 loss mean: 66.46366882324219
nll mean: 66.45482635498047 	 kl mean: 0.036557793617248535 	 loss mean: 66.49138641357422


[A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.91it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.01it/s][A

nll mean: 66.51457214355469 	 kl mean: 0.036557793617248535 	 loss mean: 66.5511245727539
nll mean: 66.4937744140625 	 kl mean: 0.036557793617248535 	 loss mean: 66.53033447265625
nll mean: 66.48674011230469 	 kl mean: 0.036557793617248535 	 loss mean: 66.52330017089844



                                               
100%|██████████| 10/10 [00:00<00:00, 10.03it/s][A
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.38it/s][A

nll mean: 66.51434326171875 	 kl mean: 0.036557793617248535 	 loss mean: 66.5509033203125
nll mean: 110.34278106689453 	 kl mean: 0.055683597922325134 	 loss mean: 110.39846801757812
nll mean: 110.30475616455078 	 kl mean: 0.055683597922325134 	 loss mean: 110.36044311523438



                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.35it/s][A
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.37it/s][A

nll mean: 110.33558654785156 	 kl mean: 0.055683597922325134 	 loss mean: 110.3912582397461
nll mean: 110.3687973022461 	 kl mean: 0.055683597922325134 	 loss mean: 110.42448425292969
nll mean: 110.30551147460938 	 kl mean: 0.055683597922325134 	 loss mean: 110.36119842529297



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.24it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.32it/s][A

nll mean: 110.29750061035156 	 kl mean: 0.055683597922325134 	 loss mean: 110.35317993164062
nll mean: 110.29142761230469 	 kl mean: 0.055683597922325134 	 loss mean: 110.34710693359375
nll mean: 110.32546997070312 	 kl mean: 0.055683597922325134 	 loss mean: 110.38114929199219



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.20it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]

nll mean: 110.27703857421875 	 kl mean: 0.055683597922325134 	 loss mean: 110.33271789550781
nll mean: 110.33244323730469 	 kl mean: 0.055683597922325134 	 loss mean: 110.38812255859375
nll mean: 142.62930297851562 	 kl mean: 0.05414373055100441 	 loss mean: 142.68344116210938



                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 10.19it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.22it/s][A

nll mean: 142.5692901611328 	 kl mean: 0.05414373055100441 	 loss mean: 142.62342834472656
nll mean: 142.6677703857422 	 kl mean: 0.05414373055100441 	 loss mean: 142.72190856933594
nll mean: 142.52670288085938 	 kl mean: 0.05414373055100441 	 loss mean: 142.58084106445312



                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.23it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A

nll mean: 142.6429443359375 	 kl mean: 0.05414373055100441 	 loss mean: 142.6970977783203
nll mean: 142.70657348632812 	 kl mean: 0.05414373055100441 	 loss mean: 142.7607421875
nll mean: 142.67446899414062 	 kl mean: 0.05414373055100441 	 loss mean: 142.72862243652344



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.17it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.11it/s][A
[A                                           

nll mean: 142.5909423828125 	 kl mean: 0.05414373055100441 	 loss mean: 142.64511108398438
nll mean: 142.59552001953125 	 kl mean: 0.05414373055100441 	 loss mean: 142.649658203125


                                               
100%|██████████| 10/10 [00:00<00:00, 10.15it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s]
 30%|███       | 3/10 [00:00<00:00, 26.57it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A

nll mean: 142.58267211914062 	 kl mean: 0.05414373055100441 	 loss mean: 142.63681030273438
nll mean: 67.959716796875 	 kl mean: 0.03106127306818962 	 loss mean: 67.99077606201172
nll mean: 67.93363952636719 	 kl mean: 0.03106127306818962 	 loss mean: 67.9646987915039
nll mean: 67.90213012695312 	 kl mean: 0.03106127306818962 	 loss mean: 67.93318939208984
nll mean: 67.98312377929688 	 kl mean: 0.03106127306818962 	 loss mean: 68.01419067382812
nll mean: 67.90121459960938 	 kl mean: 0.03106127306818962 	 loss mean: 67.93226623535156



                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A
 60%|██████    | 6/10 [00:00<00:00, 26.43it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.23it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 26.24it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 26.08it/s][A
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
[A                                   

nll mean: 67.85047149658203 	 kl mean: 0.03106127306818962 	 loss mean: 67.88153076171875
nll mean: 67.96891784667969 	 kl mean: 0.03106127306818962 	 loss mean: 67.9999771118164
nll mean: 67.84466552734375 	 kl mean: 0.03106127306818962 	 loss mean: 67.87572479248047
nll mean: 67.89496612548828 	 kl mean: 0.03106127306818962 	 loss mean: 67.926025390625
nll mean: 67.89295959472656 	 kl mean: 0.03106127306818962 	 loss mean: 67.92401885986328


                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s]
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s]
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s]
 30%|███       | 3/10 [00:00<00:00, 22.69it/s][A
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s][A
                                               
 87%|████████▋ | 33/38 [00:20<00:03,  1.46it/s][A

nll mean: 123.44609069824219 	 kl mean: 0.04835260659456253 	 loss mean: 123.49443817138672
nll mean: 123.5110092163086 	 kl mean: 0.04835260659456253 	 loss mean: 123.55935668945312
nll mean: 123.45999908447266 	 kl mean: 0.04835260659456253 	 loss mean: 123.50835418701172
nll mean: 123.50897216796875 	 kl mean: 0.04835260659456253 	 loss mean: 123.55732727050781
nll mean: 123.52464294433594 	 kl mean: 0.04835260659456253 	 loss mean: 123.57299041748047



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.54it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.46it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.46it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.46it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.52it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.43it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.50640869140625 	 kl mean: 0.04835260659456253 	 loss mean: 123.55474853515625
nll mean: 123.5340347290039 	 kl mean: 0.04835260659456253 	 loss mean: 123.58238220214844
nll mean: 123.51307678222656 	 kl mean: 0.04835260659456253 	 loss mean: 123.56143188476562
nll mean: 123.53411865234375 	 kl mean: 0.04835260659456253 	 loss mean: 123.58247375488281
nll mean: 123.4496078491211 	 kl mean: 0.04835260659456253 	 loss mean: 123.49795532226562



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A

nll mean: 126.56126403808594 	 kl mean: 0.03770046681165695 	 loss mean: 126.59896087646484
nll mean: 126.54972076416016 	 kl mean: 0.03770046681165695 	 loss mean: 126.58741760253906
nll mean: 126.50456237792969 	 kl mean: 0.03770046681165695 	 loss mean: 126.5422592163086



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.78it/s][A

nll mean: 126.61254119873047 	 kl mean: 0.03770046681165695 	 loss mean: 126.65023803710938
nll mean: 126.52517700195312 	 kl mean: 0.03770046681165695 	 loss mean: 126.56287384033203
nll mean: 126.56922912597656 	 kl mean: 0.03770046681165695 	 loss mean: 126.60691833496094



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.86it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A

nll mean: 126.45037078857422 	 kl mean: 0.03770046681165695 	 loss mean: 126.48808288574219
nll mean: 126.55694580078125 	 kl mean: 0.03770046681165695 	 loss mean: 126.59465026855469
nll mean: 126.52809143066406 	 kl mean: 0.03770046681165695 	 loss mean: 126.56580352783203



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.85it/s][A
 92%|█████████▏| 35/38 [00:21<00:01,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.94it/s][A

nll mean: 126.51522827148438 	 kl mean: 0.03770046681165695 	 loss mean: 126.55293273925781
nll mean: 118.87355041503906 	 kl mean: 0.051761042326688766 	 loss mean: 118.92530822753906
nll mean: 118.93745422363281 	 kl mean: 0.051761042326688766 	 loss mean: 118.98921203613281



                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.89it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A

nll mean: 118.81578063964844 	 kl mean: 0.051761042326688766 	 loss mean: 118.86754608154297
nll mean: 118.88951110839844 	 kl mean: 0.051761042326688766 	 loss mean: 118.94126892089844
nll mean: 118.87635803222656 	 kl mean: 0.051761042326688766 	 loss mean: 118.92811584472656



                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.80it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A

nll mean: 118.85054016113281 	 kl mean: 0.051761042326688766 	 loss mean: 118.90229797363281
nll mean: 118.91021728515625 	 kl mean: 0.051761042326688766 	 loss mean: 118.96197509765625
nll mean: 118.83778381347656 	 kl mean: 0.051761042326688766 	 loss mean: 118.8895492553711



                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:01,  1.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.78it/s][A
 95%|█████████▍| 36/38 [00:22<00:01,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.34it/s]
                                               
 95%|█████████▍| 36/38 [00:22<00:01,  1.34it/s]

nll mean: 118.85302734375 	 kl mean: 0.051761042326688766 	 loss mean: 118.90478515625
nll mean: 118.81257629394531 	 kl mean: 0.051761042326688766 	 loss mean: 118.86434936523438
nll mean: 118.12623596191406 	 kl mean: 0.04853813350200653 	 loss mean: 118.17477416992188
nll mean: 118.10398864746094 	 kl mean: 0.04853813350200653 	 loss mean: 118.15252685546875



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 23.41it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 23.01it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A

nll mean: 118.05693054199219 	 kl mean: 0.04853813350200653 	 loss mean: 118.10546875
nll mean: 118.08021545410156 	 kl mean: 0.04853813350200653 	 loss mean: 118.12875366210938
nll mean: 118.0531997680664 	 kl mean: 0.04853813350200653 	 loss mean: 118.10174560546875
nll mean: 118.16830444335938 	 kl mean: 0.04853813350200653 	 loss mean: 118.21684265136719
nll mean: 118.15164184570312 	 kl mean: 0.04853813350200653 	 loss mean: 118.20018768310547



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.45it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.37it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s]

nll mean: 118.03636169433594 	 kl mean: 0.04853813350200653 	 loss mean: 118.08489990234375
nll mean: 118.15636444091797 	 kl mean: 0.04853813350200653 	 loss mean: 118.20490264892578
nll mean: 118.09777069091797 	 kl mean: 0.04853813350200653 	 loss mean: 118.14630126953125
nll mean: 91.55155944824219 	 kl mean: 0.03732893615961075 	 loss mean: 91.5888671875
nll mean: 91.51290130615234 	 kl mean: 0.03732893615961075 	 loss mean: 91.55023193359375
nll mean: 91.46627807617188 	 kl mean: 0.03732893615961075 	 loss mean: 91.50360107421875



                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 31.19it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 31.20it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.53it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 31.12it/s][A
100%|██████████| 38/38 [00:23<00:00,  1.61it/s]


nll mean: 91.511962890625 	 kl mean: 0.03732893615961075 	 loss mean: 91.54928588867188
nll mean: 91.52670288085938 	 kl mean: 0.03732893615961075 	 loss mean: 91.56402587890625
nll mean: 91.55327606201172 	 kl mean: 0.03732893615961075 	 loss mean: 91.5905990600586
nll mean: 91.45113372802734 	 kl mean: 0.03732893615961075 	 loss mean: 91.48845672607422
nll mean: 91.49592590332031 	 kl mean: 0.03732893615961075 	 loss mean: 91.53324890136719
nll mean: 91.4415512084961 	 kl mean: 0.03732893615961075 	 loss mean: 91.4788818359375
nll mean: 91.41719818115234 	 kl mean: 0.03732893615961075 	 loss mean: 91.45452880859375
Approximate NLL:
tensor(127.1339, device='cuda:0')
Approximate KL:
tensor(0.0453, device='cuda:0')
Testing took 0:00:24.654170


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 26.18it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A

nll mean: 115.61343383789062 	 kl mean: 0.04841260612010956 	 loss mean: 115.66184997558594
nll mean: 115.56773376464844 	 kl mean: 0.04841260612010956 	 loss mean: 115.61614990234375
nll mean: 115.6533203125 	 kl mean: 0.04841260612010956 	 loss mean: 115.70172882080078
nll mean: 115.55978393554688 	 kl mean: 0.04841260612010956 	 loss mean: 115.60820007324219
nll mean: 115.63656616210938 	 kl mean: 0.04841260612010956 	 loss mean: 115.68497467041016
nll mean: 115.6214599609375 	 kl mean: 0.04841260612010956 	 loss mean: 115.66986846923828



 60%|██████    | 6/10 [00:00<00:00, 25.85it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].85it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].85it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].85it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.52it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.30it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]

nll mean: 115.60430908203125 	 kl mean: 0.04841260612010956 	 loss mean: 115.65272521972656
nll mean: 115.5488052368164 	 kl mean: 0.04841260612010956 	 loss mean: 115.59721374511719
nll mean: 115.67300415039062 	 kl mean: 0.04841260612010956 	 loss mean: 115.72142028808594
nll mean: 115.56175994873047 	 kl mean: 0.04841260612010956 	 loss mean: 115.61017608642578
nll mean: 131.80606079101562 	 kl mean: 0.05553772300481796 	 loss mean: 131.86160278320312



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.21it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.14it/s][A

nll mean: 131.8188018798828 	 kl mean: 0.05553772300481796 	 loss mean: 131.8743438720703
nll mean: 131.8060302734375 	 kl mean: 0.05553772300481796 	 loss mean: 131.861572265625
nll mean: 131.7678680419922 	 kl mean: 0.05553772300481796 	 loss mean: 131.82339477539062



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.43it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A

nll mean: 131.8046875 	 kl mean: 0.05553772300481796 	 loss mean: 131.86021423339844
nll mean: 131.72329711914062 	 kl mean: 0.05553772300481796 	 loss mean: 131.77883911132812
nll mean: 131.774658203125 	 kl mean: 0.05553772300481796 	 loss mean: 131.83018493652344



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.52it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.42it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:14,  2.52it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:14,  2.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.46it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s]

nll mean: 131.77911376953125 	 kl mean: 0.05553772300481796 	 loss mean: 131.83465576171875
nll mean: 131.87896728515625 	 kl mean: 0.05553772300481796 	 loss mean: 131.93450927734375
nll mean: 131.79624938964844 	 kl mean: 0.05553772300481796 	 loss mean: 131.85179138183594
nll mean: 105.47924041748047 	 kl mean: 0.06401652842760086 	 loss mean: 105.54325103759766



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s]
 30%|███       | 3/10 [00:00<00:00, 26.39it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.94it/s][A
                                              
 60%|██████    | 6/10 [00:00<00:00, 25.94it/s]

nll mean: 105.51324462890625 	 kl mean: 0.06401652842760086 	 loss mean: 105.57725524902344
nll mean: 105.49699401855469 	 kl mean: 0.06401652842760086 	 loss mean: 105.56100463867188
nll mean: 105.38294982910156 	 kl mean: 0.06401652842760086 	 loss mean: 105.44696044921875
nll mean: 105.44725799560547 	 kl mean: 0.06401652842760086 	 loss mean: 105.51127624511719
nll mean: 105.37538146972656 	 kl mean: 0.06401652842760086 	 loss mean: 105.43939208984375
nll mean: 105.46785736083984 	 kl mean: 0.06401652842760086 	 loss mean: 105.53187561035156


  5%|▌         | 2/38 [00:01<00:17,  2.06it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.06it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.65it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.42it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.50149536132812 	 kl mean: 0.06401652842760086 	 loss mean: 105.56551361083984
nll mean: 105.52374267578125 	 kl mean: 0.06401652842760086 	 loss mean: 105.58775329589844
nll mean: 105.44667053222656 	 kl mean: 0.06401652842760086 	 loss mean: 105.51068115234375
nll mean: 143.692138671875 	 kl mean: 0.08155611902475357 	 loss mean: 143.77369689941406


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
 20%|██        | 2/10 [00:00<00:00, 11.05it/s][A
 40%|████      | 4/10 [00:00<00:00, 11.05it/s][A

nll mean: 143.803466796875 	 kl mean: 0.08155611902475357 	 loss mean: 143.885009765625
nll mean: 143.7613067626953 	 kl mean: 0.08155611902475357 	 loss mean: 143.84286499023438
nll mean: 143.71315002441406 	 kl mean: 0.08155611902475357 	 loss mean: 143.79470825195312


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.18it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.18it/s]
 40%|████      | 4/10 [00:00<00:00, 11.05it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.18it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.99it/s][A

nll mean: 143.7735595703125 	 kl mean: 0.08155611902475357 	 loss mean: 143.85513305664062
nll mean: 143.80731201171875 	 kl mean: 0.08155611902475357 	 loss mean: 143.88888549804688
nll mean: 143.823974609375 	 kl mean: 0.08155611902475357 	 loss mean: 143.905517578125


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.18it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.99it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.18it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.18it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.98it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.98it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.68it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.75411987304688 	 kl mean: 0.08155611902475357 	 loss mean: 143.83566284179688
nll mean: 143.81434631347656 	 kl mean: 0.08155611902475357 	 loss mean: 143.89590454101562
nll mean: 143.81520080566406 	 kl mean: 0.08155611902475357 	 loss mean: 143.89675903320312



                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s]
 20%|██        | 2/10 [00:00<00:00, 14.93it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A

nll mean: 131.35865783691406 	 kl mean: 0.05569155514240265 	 loss mean: 131.4143524169922
nll mean: 131.39923095703125 	 kl mean: 0.05569155514240265 	 loss mean: 131.45492553710938
nll mean: 131.42626953125 	 kl mean: 0.05569155514240265 	 loss mean: 131.48196411132812



                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.59it/s][A

nll mean: 131.41079711914062 	 kl mean: 0.05569155514240265 	 loss mean: 131.46649169921875
nll mean: 131.35568237304688 	 kl mean: 0.05569155514240265 	 loss mean: 131.411376953125
nll mean: 131.35958862304688 	 kl mean: 0.05569155514240265 	 loss mean: 131.415283203125



                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.50it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.68it/s][A

nll mean: 131.35708618164062 	 kl mean: 0.05569155514240265 	 loss mean: 131.41278076171875
nll mean: 131.48300170898438 	 kl mean: 0.05569155514240265 	 loss mean: 131.5386962890625
nll mean: 131.37924194335938 	 kl mean: 0.05569155514240265 	 loss mean: 131.4349365234375



                                              
 11%|█         | 4/38 [00:03<00:20,  1.68it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.38it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 14.45it/s][A

nll mean: 131.41009521484375 	 kl mean: 0.05569155514240265 	 loss mean: 131.46578979492188
nll mean: 128.77999877929688 	 kl mean: 0.05137293413281441 	 loss mean: 128.83135986328125
nll mean: 128.86380004882812 	 kl mean: 0.05137293413281441 	 loss mean: 128.91517639160156



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.44it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A

nll mean: 128.80947875976562 	 kl mean: 0.05137293413281441 	 loss mean: 128.86083984375
nll mean: 128.86473083496094 	 kl mean: 0.05137293413281441 	 loss mean: 128.91610717773438
nll mean: 128.7823486328125 	 kl mean: 0.05137293413281441 	 loss mean: 128.833740234375



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.40it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.56it/s][A

nll mean: 128.87896728515625 	 kl mean: 0.05137293413281441 	 loss mean: 128.93035888671875
nll mean: 128.762939453125 	 kl mean: 0.05137293413281441 	 loss mean: 128.81430053710938
nll mean: 128.75045776367188 	 kl mean: 0.05137293413281441 	 loss mean: 128.80181884765625



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.52it/s][A
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.31it/s][A

nll mean: 128.80616760253906 	 kl mean: 0.05137293413281441 	 loss mean: 128.8575439453125
nll mean: 128.77691650390625 	 kl mean: 0.05137293413281441 	 loss mean: 128.82827758789062
nll mean: 139.17880249023438 	 kl mean: 0.04888860881328583 	 loss mean: 139.22769165039062
nll mean: 139.15245056152344 	 kl mean: 0.04888860881328583 	 loss mean: 139.2013397216797
nll mean: 139.1591033935547 	 kl mean: 0.04888860881328583 	 loss mean: 139.20799255371094



                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.55it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.15it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.55it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.55it/s][A
                                              
 60%|██████    | 6/10 [00:00<00:00, 25.15it/s]

nll mean: 139.20724487304688 	 kl mean: 0.04888860881328583 	 loss mean: 139.25613403320312
nll mean: 139.1514892578125 	 kl mean: 0.04888860881328583 	 loss mean: 139.2003631591797
nll mean: 139.15829467773438 	 kl mean: 0.04888860881328583 	 loss mean: 139.20718383789062
nll mean: 139.16366577148438 	 kl mean: 0.04888860881328583 	 loss mean: 139.2125701904297
nll mean: 139.11978149414062 	 kl mean: 0.04888860881328583 	 loss mean: 139.16867065429688
nll mean: 139.22817993164062 	 kl mean: 0.04888860881328583 	 loss mean: 139.27708435058594


 16%|█▌        | 6/38 [00:04<00:20,  1.55it/s]
 90%|█████████ | 9/10 [00:00<00:00, 25.13it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.03it/s][A
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s]
 30%|███       | 3/10 [00:00<00:00, 25.37it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
                                              

nll mean: 139.14730834960938 	 kl mean: 0.04888860881328583 	 loss mean: 139.1962127685547
nll mean: 112.33650207519531 	 kl mean: 0.061677344143390656 	 loss mean: 112.39817810058594
nll mean: 112.28874206542969 	 kl mean: 0.061677344143390656 	 loss mean: 112.35041809082031
nll mean: 112.36520385742188 	 kl mean: 0.061677344143390656 	 loss mean: 112.4268798828125
nll mean: 112.29582214355469 	 kl mean: 0.061677344143390656 	 loss mean: 112.35750579833984



 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.29it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.75it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.20it/s][A
                                              
 90%|█████████ | 9/10 [00:00<00:00, 25.20it/s]

nll mean: 112.27717590332031 	 kl mean: 0.061677344143390656 	 loss mean: 112.33885955810547
nll mean: 112.41590118408203 	 kl mean: 0.061677344143390656 	 loss mean: 112.47758483886719
nll mean: 112.29715728759766 	 kl mean: 0.061677344143390656 	 loss mean: 112.35884094238281
nll mean: 112.33964538574219 	 kl mean: 0.061677344143390656 	 loss mean: 112.40132904052734
nll mean: 112.314208984375 	 kl mean: 0.061677344143390656 	 loss mean: 112.37588500976562
nll mean: 112.4232406616211 	 kl mean: 0.061677344143390656 	 loss mean: 112.48492431640625


100%|██████████| 10/10 [00:00<00:00, 25.13it/s]
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
 20%|██        | 2/10 [00:00<00:00, 15.41it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.31it/s][A

nll mean: 138.18624877929688 	 kl mean: 0.05411480367183685 	 loss mean: 138.2403564453125
nll mean: 138.2417755126953 	 kl mean: 0.05411480367183685 	 loss mean: 138.2958984375
nll mean: 138.19454956054688 	 kl mean: 0.05411480367183685 	 loss mean: 138.24867248535156
nll mean: 138.1681365966797 	 kl mean: 0.05411480367183685 	 loss mean: 138.22225952148438


                                              
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.92it/s]
 40%|████      | 4/10 [00:00<00:00, 15.31it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.92it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.92it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.05it/s][A
 80%|████████  | 8/10 [00:00<00:00, 15.27it/s][A

nll mean: 138.09622192382812 	 kl mean: 0.05411480367183685 	 loss mean: 138.15032958984375
nll mean: 138.2265167236328 	 kl mean: 0.05411480367183685 	 loss mean: 138.2806396484375
nll mean: 138.12124633789062 	 kl mean: 0.05411480367183685 	 loss mean: 138.17535400390625
nll mean: 138.16574096679688 	 kl mean: 0.05411480367183685 	 loss mean: 138.2198486328125


                                              
 21%|██        | 8/38 [00:05<00:15,  1.92it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.92it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.27it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.33it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s]

nll mean: 138.116455078125 	 kl mean: 0.05411480367183685 	 loss mean: 138.17056274414062
nll mean: 138.12615966796875 	 kl mean: 0.05411480367183685 	 loss mean: 138.18026733398438
nll mean: 137.80162048339844 	 kl mean: 0.051559992134571075 	 loss mean: 137.85317993164062
nll mean: 137.72897338867188 	 kl mean: 0.051559992134571075 	 loss mean: 137.78054809570312



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s]
 30%|███       | 3/10 [00:00<00:00, 22.30it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.23it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A

nll mean: 137.775146484375 	 kl mean: 0.051559992134571075 	 loss mean: 137.82672119140625
nll mean: 137.81515502929688 	 kl mean: 0.051559992134571075 	 loss mean: 137.86669921875
nll mean: 137.71957397460938 	 kl mean: 0.051559992134571075 	 loss mean: 137.77114868164062
nll mean: 137.75933837890625 	 kl mean: 0.051559992134571075 	 loss mean: 137.81088256835938
nll mean: 137.7354736328125 	 kl mean: 0.051559992134571075 	 loss mean: 137.78701782226562



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.78it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.81it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.79it/s][A
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]

nll mean: 137.79507446289062 	 kl mean: 0.051559992134571075 	 loss mean: 137.8466339111328
nll mean: 137.7593994140625 	 kl mean: 0.051559992134571075 	 loss mean: 137.81097412109375
nll mean: 137.77059936523438 	 kl mean: 0.051559992134571075 	 loss mean: 137.8221435546875
nll mean: 124.69821166992188 	 kl mean: 0.04956182837486267 	 loss mean: 124.7477798461914
nll mean: 124.68841552734375 	 kl mean: 0.04956182837486267 	 loss mean: 124.73796844482422



                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
 30%|███       | 3/10 [00:00<00:00, 25.24it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.11it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s][A
[A                                           

nll mean: 124.72000885009766 	 kl mean: 0.04956182837486267 	 loss mean: 124.76956939697266
nll mean: 124.59727478027344 	 kl mean: 0.04956182837486267 	 loss mean: 124.64684295654297
nll mean: 124.60639190673828 	 kl mean: 0.04956182837486267 	 loss mean: 124.65595245361328
nll mean: 124.59552764892578 	 kl mean: 0.04956182837486267 	 loss mean: 124.64509582519531
nll mean: 124.60419464111328 	 kl mean: 0.04956182837486267 	 loss mean: 124.65374755859375


                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.04it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.97it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s]

nll mean: 124.52117919921875 	 kl mean: 0.04956182837486267 	 loss mean: 124.57073211669922
nll mean: 124.6539077758789 	 kl mean: 0.04956182837486267 	 loss mean: 124.70347595214844
nll mean: 124.61739349365234 	 kl mean: 0.04956182837486267 	 loss mean: 124.66696166992188
nll mean: 146.65249633789062 	 kl mean: 0.0427713617682457 	 loss mean: 146.6952667236328
nll mean: 146.71603393554688 	 kl mean: 0.0427713617682457 	 loss mean: 146.75881958007812



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 21.83it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.91it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A

nll mean: 146.74822998046875 	 kl mean: 0.0427713617682457 	 loss mean: 146.79098510742188
nll mean: 146.7011260986328 	 kl mean: 0.0427713617682457 	 loss mean: 146.743896484375
nll mean: 146.68798828125 	 kl mean: 0.0427713617682457 	 loss mean: 146.73077392578125
nll mean: 146.72378540039062 	 kl mean: 0.0427713617682457 	 loss mean: 146.7665557861328
nll mean: 146.63632202148438 	 kl mean: 0.0427713617682457 	 loss mean: 146.67909240722656



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.03it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.78it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.65it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s]

nll mean: 146.58526611328125 	 kl mean: 0.0427713617682457 	 loss mean: 146.6280517578125
nll mean: 146.63375854492188 	 kl mean: 0.0427713617682457 	 loss mean: 146.67654418945312
nll mean: 146.66419982910156 	 kl mean: 0.0427713617682457 	 loss mean: 146.70697021484375
nll mean: 124.87633514404297 	 kl mean: 0.05092805251479149 	 loss mean: 124.92726135253906



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s]
 20%|██        | 2/10 [00:00<00:00, 12.91it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.81it/s][A

nll mean: 124.87836456298828 	 kl mean: 0.05092805251479149 	 loss mean: 124.92929077148438
nll mean: 124.89703369140625 	 kl mean: 0.05092805251479149 	 loss mean: 124.94796752929688
nll mean: 124.9155502319336 	 kl mean: 0.05092805251479149 	 loss mean: 124.96647644042969



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.07it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.07it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.69it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.07it/s][A

nll mean: 124.91793823242188 	 kl mean: 0.05092805251479149 	 loss mean: 124.96885681152344
nll mean: 124.8587646484375 	 kl mean: 0.05092805251479149 	 loss mean: 124.9096908569336
nll mean: 124.92703247070312 	 kl mean: 0.05092805251479149 	 loss mean: 124.97795867919922



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.07it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.60it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.07it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.07it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.63it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.97636413574219 	 kl mean: 0.05092805251479149 	 loss mean: 125.02729797363281
nll mean: 124.85586547851562 	 kl mean: 0.05092805251479149 	 loss mean: 124.90678405761719
nll mean: 124.79621887207031 	 kl mean: 0.05092805251479149 	 loss mean: 124.8471450805664



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s]
 10%|█         | 1/10 [00:00<00:00,  9.70it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.78it/s][A
[A                                           

nll mean: 168.0858612060547 	 kl mean: 0.05743478983640671 	 loss mean: 168.14329528808594
nll mean: 168.1932373046875 	 kl mean: 0.05743478983640671 	 loss mean: 168.25067138671875


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.81it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.84it/s][A
                                               

nll mean: 168.13169860839844 	 kl mean: 0.05743478983640671 	 loss mean: 168.18914794921875
nll mean: 168.20504760742188 	 kl mean: 0.05743478983640671 	 loss mean: 168.26248168945312



 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.96it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.73it/s][A

nll mean: 168.1437530517578 	 kl mean: 0.05743478983640671 	 loss mean: 168.20118713378906
nll mean: 168.14093017578125 	 kl mean: 0.05743478983640671 	 loss mean: 168.1983642578125
nll mean: 168.12417602539062 	 kl mean: 0.05743478983640671 	 loss mean: 168.18162536621094



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.73it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.04it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.73it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.07it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s]

nll mean: 168.1436004638672 	 kl mean: 0.05743478983640671 	 loss mean: 168.20101928710938
nll mean: 168.17694091796875 	 kl mean: 0.05743478983640671 	 loss mean: 168.234375
nll mean: 168.15325927734375 	 kl mean: 0.05743478983640671 	 loss mean: 168.210693359375



  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s]
 20%|██        | 2/10 [00:00<00:00, 18.67it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.55it/s][A

nll mean: 140.44631958007812 	 kl mean: 0.0623457208275795 	 loss mean: 140.50865173339844
nll mean: 140.359130859375 	 kl mean: 0.0623457208275795 	 loss mean: 140.42149353027344
nll mean: 140.30947875976562 	 kl mean: 0.0623457208275795 	 loss mean: 140.371826171875
nll mean: 140.36830139160156 	 kl mean: 0.0623457208275795 	 loss mean: 140.43064880371094



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.49it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.49it/s][A

nll mean: 140.40692138671875 	 kl mean: 0.0623457208275795 	 loss mean: 140.4692840576172
nll mean: 140.3717041015625 	 kl mean: 0.0623457208275795 	 loss mean: 140.43405151367188
nll mean: 140.30902099609375 	 kl mean: 0.0623457208275795 	 loss mean: 140.37136840820312
nll mean: 140.21697998046875 	 kl mean: 0.0623457208275795 	 loss mean: 140.27932739257812



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.42it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.42it/s][A
 39%|███▉      | 15/38 [00:08<00:15,  1.52it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 140.25477600097656 	 kl mean: 0.0623457208275795 	 loss mean: 140.31710815429688
nll mean: 140.36190795898438 	 kl mean: 0.0623457208275795 	 loss mean: 140.42425537109375
nll mean: 149.10467529296875 	 kl mean: 0.05650683492422104 	 loss mean: 149.16119384765625


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 10.93it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.91it/s][A

nll mean: 149.08555603027344 	 kl mean: 0.05650683492422104 	 loss mean: 149.14205932617188
nll mean: 149.10353088378906 	 kl mean: 0.05650683492422104 	 loss mean: 149.1600341796875
nll mean: 149.08106994628906 	 kl mean: 0.05650683492422104 	 loss mean: 149.1375732421875


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 10.91it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.94it/s][A

nll mean: 149.08815002441406 	 kl mean: 0.05650683492422104 	 loss mean: 149.1446533203125
nll mean: 149.07998657226562 	 kl mean: 0.05650683492422104 	 loss mean: 149.13648986816406
nll mean: 149.11094665527344 	 kl mean: 0.05650683492422104 	 loss mean: 149.16744995117188


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.94it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.52it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.96it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.91it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 149.04788208007812 	 kl mean: 0.05650683492422104 	 loss mean: 149.10438537597656
nll mean: 149.0616455078125 	 kl mean: 0.05650683492422104 	 loss mean: 149.1181640625
nll mean: 149.18035888671875 	 kl mean: 0.05650683492422104 	 loss mean: 149.23687744140625



                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.36it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.36it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.36it/s]
 30%|███       | 3/10 [00:00<00:00, 25.38it/s][A
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.36it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.36it/s][A

nll mean: 149.8246307373047 	 kl mean: 0.07639890909194946 	 loss mean: 149.90103149414062
nll mean: 149.75131225585938 	 kl mean: 0.07639890909194946 	 loss mean: 149.8277130126953
nll mean: 149.7975616455078 	 kl mean: 0.07639890909194946 	 loss mean: 149.87396240234375
nll mean: 149.76939392089844 	 kl mean: 0.07639890909194946 	 loss mean: 149.84579467773438
nll mean: 149.73855590820312 	 kl mean: 0.07639890909194946 	 loss mean: 149.81497192382812



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.36it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.19it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.36it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.36it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.36it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.14it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.04it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               


nll mean: 149.7854766845703 	 kl mean: 0.07639890909194946 	 loss mean: 149.86187744140625
nll mean: 149.716064453125 	 kl mean: 0.07639890909194946 	 loss mean: 149.79244995117188
nll mean: 149.78575134277344 	 kl mean: 0.07639890909194946 	 loss mean: 149.86215209960938
nll mean: 149.71441650390625 	 kl mean: 0.07639890909194946 	 loss mean: 149.7908172607422
nll mean: 149.81951904296875 	 kl mean: 0.07639890909194946 	 loss mean: 149.8959197998047


 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
 30%|███       | 3/10 [00:00<00:00, 25.94it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.69it/s][A

nll mean: 139.31362915039062 	 kl mean: 0.050050437450408936 	 loss mean: 139.36367797851562
nll mean: 139.39073181152344 	 kl mean: 0.050050437450408936 	 loss mean: 139.44078063964844
nll mean: 139.31588745117188 	 kl mean: 0.050050437450408936 	 loss mean: 139.36593627929688
nll mean: 139.42477416992188 	 kl mean: 0.050050437450408936 	 loss mean: 139.4748077392578
nll mean: 139.3358154296875 	 kl mean: 0.050050437450408936 	 loss mean: 139.3858642578125
nll mean: 139.30810546875 	 kl mean: 0.050050437450408936 	 loss mean: 139.358154296875


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.69it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.57it/s]
100%|██████████| 10/10 [00:00<00:00, 25.30it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.35763549804688 	 kl mean: 0.050050437450408936 	 loss mean: 139.40768432617188
nll mean: 139.28260803222656 	 kl mean: 0.050050437450408936 	 loss mean: 139.33267211914062
nll mean: 139.44476318359375 	 kl mean: 0.050050437450408936 	 loss mean: 139.49481201171875
nll mean: 139.4346923828125 	 kl mean: 0.050050437450408936 	 loss mean: 139.48477172851562



                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s]
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s][A

nll mean: 136.71104431152344 	 kl mean: 0.05801922827959061 	 loss mean: 136.76905822753906
nll mean: 136.76995849609375 	 kl mean: 0.05801922827959061 	 loss mean: 136.8280029296875
nll mean: 136.62899780273438 	 kl mean: 0.05801922827959061 	 loss mean: 136.68702697753906



                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.77it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.72it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.76it/s][A

nll mean: 136.76002502441406 	 kl mean: 0.05801922827959061 	 loss mean: 136.81805419921875
nll mean: 136.7076416015625 	 kl mean: 0.05801922827959061 	 loss mean: 136.7656707763672
nll mean: 136.79266357421875 	 kl mean: 0.05801922827959061 	 loss mean: 136.85069274902344



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A

nll mean: 136.62234497070312 	 kl mean: 0.05801922827959061 	 loss mean: 136.68035888671875
nll mean: 136.70982360839844 	 kl mean: 0.05801922827959061 	 loss mean: 136.76785278320312
nll mean: 136.73471069335938 	 kl mean: 0.05801922827959061 	 loss mean: 136.792724609375



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.77it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.63it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A

nll mean: 136.75692749023438 	 kl mean: 0.05801922827959061 	 loss mean: 136.81494140625
nll mean: 153.68258666992188 	 kl mean: 0.04644612967967987 	 loss mean: 153.72903442382812
nll mean: 153.7083740234375 	 kl mean: 0.04644612967967987 	 loss mean: 153.7548065185547


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A

nll mean: 153.66598510742188 	 kl mean: 0.04644612967967987 	 loss mean: 153.7124481201172
nll mean: 153.7032012939453 	 kl mean: 0.04644612967967987 	 loss mean: 153.74966430664062
nll mean: 153.57003784179688 	 kl mean: 0.04644612967967987 	 loss mean: 153.61648559570312


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A

nll mean: 153.60763549804688 	 kl mean: 0.04644612967967987 	 loss mean: 153.65408325195312
nll mean: 153.66146850585938 	 kl mean: 0.04644612967967987 	 loss mean: 153.70791625976562
nll mean: 153.71414184570312 	 kl mean: 0.04644612967967987 	 loss mean: 153.76058959960938


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.57it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 153.66958618164062 	 kl mean: 0.04644612967967987 	 loss mean: 153.71603393554688
nll mean: 153.76512145996094 	 kl mean: 0.04644612967967987 	 loss mean: 153.81155395507812
nll mean: 161.4363250732422 	 kl mean: 0.059385016560554504 	 loss mean: 161.49569702148438


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 12.97it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.94it/s][A

nll mean: 161.42674255371094 	 kl mean: 0.059385016560554504 	 loss mean: 161.48614501953125
nll mean: 161.39410400390625 	 kl mean: 0.059385016560554504 	 loss mean: 161.4534912109375
nll mean: 161.43801879882812 	 kl mean: 0.059385016560554504 	 loss mean: 161.49740600585938


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 12.94it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.99it/s][A

nll mean: 161.4132080078125 	 kl mean: 0.059385016560554504 	 loss mean: 161.47259521484375
nll mean: 161.40020751953125 	 kl mean: 0.059385016560554504 	 loss mean: 161.45960998535156
nll mean: 161.472900390625 	 kl mean: 0.059385016560554504 	 loss mean: 161.53228759765625


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.99it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.93it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.83it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 161.40353393554688 	 kl mean: 0.059385016560554504 	 loss mean: 161.46292114257812
nll mean: 161.44454956054688 	 kl mean: 0.059385016560554504 	 loss mean: 161.50392150878906
nll mean: 161.41726684570312 	 kl mean: 0.059385016560554504 	 loss mean: 161.47665405273438


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 10.38it/s][A

nll mean: 123.31526184082031 	 kl mean: 0.05544523149728775 	 loss mean: 123.37071228027344
nll mean: 123.42332458496094 	 kl mean: 0.05544523149728775 	 loss mean: 123.47876739501953
nll mean: 123.37977600097656 	 kl mean: 0.05544523149728775 	 loss mean: 123.43522644042969


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 10.38it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 10.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.35it/s][A

nll mean: 123.36372375488281 	 kl mean: 0.05544523149728775 	 loss mean: 123.41917419433594
nll mean: 123.34815979003906 	 kl mean: 0.05544523149728775 	 loss mean: 123.40360260009766
nll mean: 123.38076782226562 	 kl mean: 0.05544523149728775 	 loss mean: 123.43621063232422


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.35it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.43it/s][A

nll mean: 123.36288452148438 	 kl mean: 0.05544523149728775 	 loss mean: 123.4183349609375
nll mean: 123.35350799560547 	 kl mean: 0.05544523149728775 	 loss mean: 123.4089584350586
nll mean: 123.45111846923828 	 kl mean: 0.05544523149728775 	 loss mean: 123.50655364990234


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.44it/s][A
 58%|█████▊    | 22/38 [00:13<00:12,  1.27it/s]
                                               
 58%|█████▊    | 22/38 [00:13<00:12,  1.27it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
 40%|████      | 4/10 [00:00<00:00, 34.09it/s][A

nll mean: 123.43528747558594 	 kl mean: 0.05544523149728775 	 loss mean: 123.49073791503906
nll mean: 111.08750915527344 	 kl mean: 0.039814796298742294 	 loss mean: 111.1273193359375
nll mean: 111.12228393554688 	 kl mean: 0.039814796298742294 	 loss mean: 111.16209411621094
nll mean: 111.1817398071289 	 kl mean: 0.039814796298742294 	 loss mean: 111.2215576171875
nll mean: 111.11570739746094 	 kl mean: 0.039814796298742294 	 loss mean: 111.155517578125
nll mean: 111.09347534179688 	 kl mean: 0.039814796298742294 	 loss mean: 111.13328552246094
nll mean: 111.20711517333984 	 kl mean: 0.039814796298742294 	 loss mean: 111.24693298339844


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
 40%|████      | 4/10 [00:00<00:00, 34.09it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.27it/s]
100%|██████████| 10/10 [00:00<00:00, 33.32it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.11343383789062 	 kl mean: 0.039814796298742294 	 loss mean: 111.15325164794922
nll mean: 111.15188598632812 	 kl mean: 0.039814796298742294 	 loss mean: 111.19171142578125
nll mean: 111.24853515625 	 kl mean: 0.039814796298742294 	 loss mean: 111.28834533691406
nll mean: 111.0790786743164 	 kl mean: 0.039814796298742294 	 loss mean: 111.118896484375
nll mean: 163.7589111328125 	 kl mean: 0.05467505753040314 	 loss mean: 163.8135986328125


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.49it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.54it/s][A

nll mean: 163.879638671875 	 kl mean: 0.05467505753040314 	 loss mean: 163.93431091308594
nll mean: 163.75906372070312 	 kl mean: 0.05467505753040314 	 loss mean: 163.813720703125
nll mean: 163.7436981201172 	 kl mean: 0.05467505753040314 	 loss mean: 163.79837036132812


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 14.54it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
                                               [A


nll mean: 163.7152099609375 	 kl mean: 0.05467505753040314 	 loss mean: 163.76986694335938
nll mean: 163.75192260742188 	 kl mean: 0.05467505753040314 	 loss mean: 163.80661010742188
nll mean: 163.75050354003906 	 kl mean: 0.05467505753040314 	 loss mean: 163.80519104003906


 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.63it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.68it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.74it/s][A
 63%|██████▎   | 24/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:14<00:09,  1.53it/s]

nll mean: 163.68077087402344 	 kl mean: 0.05467505753040314 	 loss mean: 163.73544311523438
nll mean: 163.69821166992188 	 kl mean: 0.05467505753040314 	 loss mean: 163.75289916992188
nll mean: 163.75999450683594 	 kl mean: 0.05467505753040314 	 loss mean: 163.81466674804688
nll mean: 128.30914306640625 	 kl mean: 0.05359816551208496 	 loss mean: 128.36273193359375



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 22.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.41it/s][A

nll mean: 128.3239288330078 	 kl mean: 0.05359816551208496 	 loss mean: 128.37753295898438
nll mean: 128.40350341796875 	 kl mean: 0.05359816551208496 	 loss mean: 128.4571075439453
nll mean: 128.40814208984375 	 kl mean: 0.05359816551208496 	 loss mean: 128.46176147460938
nll mean: 128.42611694335938 	 kl mean: 0.05359816551208496 	 loss mean: 128.47970581054688
nll mean: 128.41610717773438 	 kl mean: 0.05359816551208496 	 loss mean: 128.46971130371094



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.53it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.24it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.09it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.42564392089844 	 kl mean: 0.05359816551208496 	 loss mean: 128.479248046875
nll mean: 128.4193878173828 	 kl mean: 0.05359816551208496 	 loss mean: 128.47299194335938
nll mean: 128.41554260253906 	 kl mean: 0.05359816551208496 	 loss mean: 128.46914672851562
nll mean: 128.4356689453125 	 kl mean: 0.05359816551208496 	 loss mean: 128.4892578125



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s]
 20%|██        | 2/10 [00:00<00:00, 14.96it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
                                               

nll mean: 120.65596008300781 	 kl mean: 0.057830389589071274 	 loss mean: 120.71379089355469
nll mean: 120.60739135742188 	 kl mean: 0.057830389589071274 	 loss mean: 120.66521453857422
nll mean: 120.62493896484375 	 kl mean: 0.057830389589071274 	 loss mean: 120.68276977539062



 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.98it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
                                               

nll mean: 120.61509704589844 	 kl mean: 0.057830389589071274 	 loss mean: 120.67292785644531
nll mean: 120.49237060546875 	 kl mean: 0.057830389589071274 	 loss mean: 120.55020141601562
nll mean: 120.60374450683594 	 kl mean: 0.057830389589071274 	 loss mean: 120.66158294677734
nll mean: 120.67461395263672 	 kl mean: 0.057830389589071274 	 loss mean: 120.7324447631836



 66%|██████▌   | 25/38 [00:15<00:07,  1.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 15.03it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.68it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.68it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.99it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s]

nll mean: 120.56697082519531 	 kl mean: 0.057830389589071274 	 loss mean: 120.62479400634766
nll mean: 120.63785552978516 	 kl mean: 0.057830389589071274 	 loss mean: 120.69569396972656
nll mean: 120.55787658691406 	 kl mean: 0.057830389589071274 	 loss mean: 120.61570739746094
nll mean: 87.39065551757812 	 kl mean: 0.10786885023117065 	 loss mean: 87.49852752685547



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s]
 30%|███       | 3/10 [00:00<00:00, 21.70it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.84it/s][A

nll mean: 87.42894744873047 	 kl mean: 0.10786885023117065 	 loss mean: 87.53681945800781
nll mean: 87.39469909667969 	 kl mean: 0.10786885023117065 	 loss mean: 87.50257873535156
nll mean: 87.40087890625 	 kl mean: 0.10786885023117065 	 loss mean: 87.50875854492188
nll mean: 87.33358764648438 	 kl mean: 0.10786885023117065 	 loss mean: 87.44145202636719
nll mean: 87.36949157714844 	 kl mean: 0.10786885023117065 	 loss mean: 87.47735595703125



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.62it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.01it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.17it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]

nll mean: 87.355224609375 	 kl mean: 0.10786885023117065 	 loss mean: 87.46310424804688
nll mean: 87.40312194824219 	 kl mean: 0.10786885023117065 	 loss mean: 87.510986328125
nll mean: 87.4384765625 	 kl mean: 0.10786885023117065 	 loss mean: 87.54635620117188
nll mean: 87.46040344238281 	 kl mean: 0.10786885023117065 	 loss mean: 87.56827545166016
nll mean: 114.26921081542969 	 kl mean: 0.04073631018400192 	 loss mean: 114.30995178222656



                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
 30%|███       | 3/10 [00:00<00:00, 20.63it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 20.77it/s][A

nll mean: 114.22698974609375 	 kl mean: 0.04073631018400192 	 loss mean: 114.26773071289062
nll mean: 114.22819519042969 	 kl mean: 0.04073631018400192 	 loss mean: 114.26893615722656
nll mean: 114.20408630371094 	 kl mean: 0.04073631018400192 	 loss mean: 114.24482727050781
nll mean: 114.14088439941406 	 kl mean: 0.04073631018400192 	 loss mean: 114.18162536621094
nll mean: 114.27247619628906 	 kl mean: 0.04073631018400192 	 loss mean: 114.31321716308594



                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 20.71it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 20.71it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 114.23027801513672 	 kl mean: 0.04073631018400192 	 loss mean: 114.27101135253906
nll mean: 114.15650177001953 	 kl mean: 0.04073631018400192 	 loss mean: 114.19723510742188
nll mean: 114.18539428710938 	 kl mean: 0.04073631018400192 	 loss mean: 114.22613525390625
nll mean: 114.1722412109375 	 kl mean: 0.04073631018400192 	 loss mean: 114.21297454833984



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 11.74it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 126.36167907714844 	 kl mean: 0.05378459393978119 	 loss mean: 126.41546630859375
nll mean: 126.33072662353516 	 kl mean: 0.05378459393978119 	 loss mean: 126.38451385498047
nll mean: 126.36735534667969 	 kl mean: 0.05378459393978119 	 loss mean: 126.42115020751953



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 11.86it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 11.90it/s][A

nll mean: 126.36302185058594 	 kl mean: 0.05378459393978119 	 loss mean: 126.41679382324219
nll mean: 126.33056640625 	 kl mean: 0.05378459393978119 	 loss mean: 126.38435363769531
nll mean: 126.3438949584961 	 kl mean: 0.05378459393978119 	 loss mean: 126.39767456054688



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 11.80it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 126.36844635009766 	 kl mean: 0.05378459393978119 	 loss mean: 126.4222412109375
nll mean: 126.29756164550781 	 kl mean: 0.05378459393978119 	 loss mean: 126.3513412475586
nll mean: 126.35009765625 	 kl mean: 0.05378459393978119 	 loss mean: 126.40388488769531



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 11.85it/s][A
 76%|███████▋  | 29/38 [00:17<00:05,  1.58it/s]
                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.48it/s][A

nll mean: 126.24559020996094 	 kl mean: 0.05378459393978119 	 loss mean: 126.29936218261719
nll mean: 67.29618835449219 	 kl mean: 0.04368635267019272 	 loss mean: 67.33987426757812


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 10%|█         | 1/10 [00:00<00:00,  9.48it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00,  9.44it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.57it/s][A

nll mean: 67.1792221069336 	 kl mean: 0.04368635267019272 	 loss mean: 67.22291564941406
nll mean: 67.197021484375 	 kl mean: 0.04368635267019272 	 loss mean: 67.24070739746094


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 30%|███       | 3/10 [00:00<00:00,  9.57it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00,  9.58it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.59it/s][A

nll mean: 67.26145935058594 	 kl mean: 0.04368635267019272 	 loss mean: 67.3051528930664
nll mean: 67.2306900024414 	 kl mean: 0.04368635267019272 	 loss mean: 67.27437591552734


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.59it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.62it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.64it/s][A

nll mean: 67.34273529052734 	 kl mean: 0.04368635267019272 	 loss mean: 67.38642120361328
nll mean: 67.24909973144531 	 kl mean: 0.04368635267019272 	 loss mean: 67.29278564453125


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.64it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.67it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.64it/s][A

nll mean: 67.21015930175781 	 kl mean: 0.04368635267019272 	 loss mean: 67.25385284423828
nll mean: 67.27647399902344 	 kl mean: 0.04368635267019272 	 loss mean: 67.32015991210938


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.58it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.64it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.58it/s][A
 79%|███████▉  | 30/38 [00:18<00:06,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:18<00:06,  1.32it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00, 12.32it/s][A

nll mean: 67.25743103027344 	 kl mean: 0.04368635267019272 	 loss mean: 67.30110931396484
nll mean: 110.06246185302734 	 kl mean: 0.07960797846317291 	 loss mean: 110.14207458496094
nll mean: 110.03124237060547 	 kl mean: 0.07960797846317291 	 loss mean: 110.11085510253906



                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.35it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A

nll mean: 110.03475952148438 	 kl mean: 0.07960797846317291 	 loss mean: 110.11436462402344
nll mean: 110.01974487304688 	 kl mean: 0.07960797846317291 	 loss mean: 110.09934997558594
nll mean: 109.95478820800781 	 kl mean: 0.07960797846317291 	 loss mean: 110.03440856933594



                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A

nll mean: 109.97674560546875 	 kl mean: 0.07960797846317291 	 loss mean: 110.05635833740234
nll mean: 110.00798034667969 	 kl mean: 0.07960797846317291 	 loss mean: 110.08758544921875
nll mean: 110.02677917480469 	 kl mean: 0.07960797846317291 	 loss mean: 110.10638427734375



                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:06,  1.32it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.35it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.29it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.29it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.72it/s][A

nll mean: 110.00003051757812 	 kl mean: 0.07960797846317291 	 loss mean: 110.07962799072266
nll mean: 110.0210189819336 	 kl mean: 0.07960797846317291 	 loss mean: 110.10061645507812
nll mean: 144.24630737304688 	 kl mean: 0.07209731638431549 	 loss mean: 144.3184051513672


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.29it/s]
 10%|█         | 1/10 [00:00<00:00,  9.72it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 20%|██        | 2/10 [00:00<00:00,  9.71it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.65it/s][A

nll mean: 144.151611328125 	 kl mean: 0.07209731638431549 	 loss mean: 144.22372436523438
nll mean: 144.22286987304688 	 kl mean: 0.07209731638431549 	 loss mean: 144.29498291015625


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 30%|███       | 3/10 [00:00<00:00,  9.65it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 40%|████      | 4/10 [00:00<00:00,  9.58it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.50it/s][A

nll mean: 144.20074462890625 	 kl mean: 0.07209731638431549 	 loss mean: 144.27284240722656
nll mean: 144.30172729492188 	 kl mean: 0.07209731638431549 	 loss mean: 144.37384033203125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.50it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.57it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.59it/s][A

nll mean: 144.2777557373047 	 kl mean: 0.07209731638431549 	 loss mean: 144.349853515625
nll mean: 144.17608642578125 	 kl mean: 0.07209731638431549 	 loss mean: 144.2481689453125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.59it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.63it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.56it/s][A

nll mean: 144.22763061523438 	 kl mean: 0.07209731638431549 	 loss mean: 144.2997283935547
nll mean: 144.30035400390625 	 kl mean: 0.07209731638431549 	 loss mean: 144.37245178222656


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.29it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.56it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.54it/s][A
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s]
 30%|███       | 3/10 [00:00<00:00, 24.85it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s][A

nll mean: 144.20335388183594 	 kl mean: 0.07209731638431549 	 loss mean: 144.27545166015625
nll mean: 68.61158752441406 	 kl mean: 0.0506645105779171 	 loss mean: 68.6622543334961
nll mean: 68.65335845947266 	 kl mean: 0.0506645105779171 	 loss mean: 68.70401763916016
nll mean: 68.5602035522461 	 kl mean: 0.0506645105779171 	 loss mean: 68.61087036132812
nll mean: 68.60160827636719 	 kl mean: 0.0506645105779171 	 loss mean: 68.65226745605469



                                               
 84%|████████▍ | 32/38 [00:20<00:05,  1.17it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.17it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.62it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.17it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.17it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.17it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.53it/s][A

nll mean: 68.60845947265625 	 kl mean: 0.0506645105779171 	 loss mean: 68.65912628173828
nll mean: 68.50335693359375 	 kl mean: 0.0506645105779171 	 loss mean: 68.55402374267578
nll mean: 68.69364929199219 	 kl mean: 0.0506645105779171 	 loss mean: 68.74431610107422
nll mean: 68.58932495117188 	 kl mean: 0.0506645105779171 	 loss mean: 68.6399917602539
nll mean: 68.58821868896484 	 kl mean: 0.0506645105779171 	 loss mean: 68.63888549804688



                                               
100%|██████████| 10/10 [00:00<00:00, 24.41it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s]
 30%|███       | 3/10 [00:00<00:00, 20.84it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A

nll mean: 68.60529327392578 	 kl mean: 0.0506645105779171 	 loss mean: 68.65596008300781
nll mean: 124.14991760253906 	 kl mean: 0.06799077987670898 	 loss mean: 124.2178955078125
nll mean: 124.18168640136719 	 kl mean: 0.06799077987670898 	 loss mean: 124.24967956542969
nll mean: 124.21866607666016 	 kl mean: 0.06799077987670898 	 loss mean: 124.28665161132812
nll mean: 124.08160400390625 	 kl mean: 0.06799077987670898 	 loss mean: 124.14959716796875



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 20.87it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.38it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 20.98it/s][A

nll mean: 124.14505004882812 	 kl mean: 0.06799077987670898 	 loss mean: 124.2130355834961
nll mean: 124.236572265625 	 kl mean: 0.06799077987670898 	 loss mean: 124.30455780029297
nll mean: 124.01113891601562 	 kl mean: 0.06799077987670898 	 loss mean: 124.0791244506836
nll mean: 124.08228302001953 	 kl mean: 0.06799077987670898 	 loss mean: 124.15027618408203
nll mean: 124.16799926757812 	 kl mean: 0.06799077987670898 	 loss mean: 124.23599243164062



                                               
100%|██████████| 10/10 [00:00<00:00, 21.04it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.54it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A

nll mean: 124.22969055175781 	 kl mean: 0.06799077987670898 	 loss mean: 124.29768371582031
nll mean: 126.20558166503906 	 kl mean: 0.0418442040681839 	 loss mean: 126.24742126464844
nll mean: 126.18933868408203 	 kl mean: 0.0418442040681839 	 loss mean: 126.23118591308594



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.54it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.54it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.40it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A

nll mean: 126.23127746582031 	 kl mean: 0.0418442040681839 	 loss mean: 126.27312469482422
nll mean: 126.14218139648438 	 kl mean: 0.0418442040681839 	 loss mean: 126.18402862548828
nll mean: 126.17858123779297 	 kl mean: 0.0418442040681839 	 loss mean: 126.22042846679688



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.39it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.37it/s][A

nll mean: 126.15956115722656 	 kl mean: 0.0418442040681839 	 loss mean: 126.201416015625
nll mean: 126.05308532714844 	 kl mean: 0.0418442040681839 	 loss mean: 126.09494018554688
nll mean: 126.09541320800781 	 kl mean: 0.0418442040681839 	 loss mean: 126.13726043701172



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.54it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.35it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s]

nll mean: 126.19731140136719 	 kl mean: 0.0418442040681839 	 loss mean: 126.2391586303711
nll mean: 126.21605682373047 	 kl mean: 0.0418442040681839 	 loss mean: 126.25789642333984
nll mean: 117.74310302734375 	 kl mean: 0.06847818195819855 	 loss mean: 117.81158447265625



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s]
 20%|██        | 2/10 [00:00<00:00, 10.61it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A

nll mean: 117.88176727294922 	 kl mean: 0.06847818195819855 	 loss mean: 117.95024108886719
nll mean: 117.88581085205078 	 kl mean: 0.06847818195819855 	 loss mean: 117.95428466796875
nll mean: 117.90377044677734 	 kl mean: 0.06847818195819855 	 loss mean: 117.97225189208984



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.43it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.56it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.43it/s][A

nll mean: 117.86761474609375 	 kl mean: 0.06847818195819855 	 loss mean: 117.93609619140625
nll mean: 117.865966796875 	 kl mean: 0.06847818195819855 	 loss mean: 117.9344482421875
nll mean: 117.8311996459961 	 kl mean: 0.06847818195819855 	 loss mean: 117.8996810913086



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.43it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.54it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.43it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.50it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.99697875976562 	 kl mean: 0.06847818195819855 	 loss mean: 118.06544494628906
nll mean: 117.86750793457031 	 kl mean: 0.06847818195819855 	 loss mean: 117.93598937988281
nll mean: 117.82299041748047 	 kl mean: 0.06847818195819855 	 loss mean: 117.89146423339844



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s]
 30%|███       | 3/10 [00:00<00:00, 23.25it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A

nll mean: 116.71792602539062 	 kl mean: 0.0614810511469841 	 loss mean: 116.77940368652344
nll mean: 116.72998809814453 	 kl mean: 0.0614810511469841 	 loss mean: 116.79146575927734
nll mean: 116.68624114990234 	 kl mean: 0.0614810511469841 	 loss mean: 116.74772644042969
nll mean: 116.61521911621094 	 kl mean: 0.0614810511469841 	 loss mean: 116.67669677734375
nll mean: 116.68667602539062 	 kl mean: 0.0614810511469841 	 loss mean: 116.74815368652344



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.61it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.29it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.35it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.86it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.64645385742188 	 kl mean: 0.0614810511469841 	 loss mean: 116.70792388916016
nll mean: 116.57838439941406 	 kl mean: 0.0614810511469841 	 loss mean: 116.63986206054688
nll mean: 116.67903137207031 	 kl mean: 0.0614810511469841 	 loss mean: 116.74050903320312
nll mean: 116.69420623779297 	 kl mean: 0.0614810511469841 	 loss mean: 116.75568389892578
nll mean: 116.61673736572266 	 kl mean: 0.0614810511469841 	 loss mean: 116.67821502685547



                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 31.08it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s][A

nll mean: 90.4976806640625 	 kl mean: 0.03874246031045914 	 loss mean: 90.53642272949219
nll mean: 90.47701263427734 	 kl mean: 0.03874246031045914 	 loss mean: 90.51576232910156
nll mean: 90.50786590576172 	 kl mean: 0.03874246031045914 	 loss mean: 90.54660034179688
nll mean: 90.47795867919922 	 kl mean: 0.03874246031045914 	 loss mean: 90.51670837402344
nll mean: 90.48179626464844 	 kl mean: 0.03874246031045914 	 loss mean: 90.5205307006836
nll mean: 90.4749755859375 	 kl mean: 0.03874246031045914 	 loss mean: 90.51372528076172
nll mean: 90.48918151855469 	 kl mean: 0.03874246031045914 	 loss mean: 90.52791595458984



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.67it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.52it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 90.40907287597656 	 kl mean: 0.03874246031045914 	 loss mean: 90.44781494140625
nll mean: 90.53271484375 	 kl mean: 0.03874246031045914 	 loss mean: 90.57145690917969
nll mean: 90.54978942871094 	 kl mean: 0.03874246031045914 	 loss mean: 90.5885238647461
Approximate NLL:
tensor(127.0737, device='cuda:0')
Approximate KL:
tensor(0.0573, device='cuda:0')
Testing took 0:00:25.174618


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .87it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .87it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .87it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        


nll mean: 115.93900299072266 	 kl mean: 0.06263197213411331 	 loss mean: 116.00163269042969
nll mean: 115.8943099975586 	 kl mean: 0.06263197213411331 	 loss mean: 115.95693969726562
nll mean: 115.87395477294922 	 kl mean: 0.06263197213411331 	 loss mean: 115.93658447265625
nll mean: 115.95991516113281 	 kl mean: 0.06263197213411331 	 loss mean: 116.02254486083984
nll mean: 115.78607177734375 	 kl mean: 0.06263197213411331 	 loss mean: 115.84870147705078
nll mean: 115.89356231689453 	 kl mean: 0.06263197213411331 	 loss mean: 115.9561996459961


 30%|███       | 3/10 [00:00<00:00, 25.87it/s][A
                                      .63it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .63it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .63it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.63it/s][A
                                      .34it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.16it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 115.84300231933594 	 kl mean: 0.06263197213411331 	 loss mean: 115.90562438964844
nll mean: 115.89871978759766 	 kl mean: 0.06263197213411331 	 loss mean: 115.96134948730469
nll mean: 116.01022338867188 	 kl mean: 0.06263197213411331 	 loss mean: 116.0728530883789
nll mean: 115.97905731201172 	 kl mean: 0.06263197213411331 	 loss mean: 116.04168701171875
nll mean: 132.40850830078125 	 kl mean: 0.06534126400947571 	 loss mean: 132.47384643554688


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 14.28it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.15it/s][A

nll mean: 132.52743530273438 	 kl mean: 0.06534126400947571 	 loss mean: 132.5927734375
nll mean: 132.32159423828125 	 kl mean: 0.06534126400947571 	 loss mean: 132.38693237304688
nll mean: 132.47161865234375 	 kl mean: 0.06534126400947571 	 loss mean: 132.53695678710938


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 40%|████      | 4/10 [00:00<00:00, 14.15it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.20it/s][A

nll mean: 132.48678588867188 	 kl mean: 0.06534126400947571 	 loss mean: 132.5521240234375
nll mean: 132.51327514648438 	 kl mean: 0.06534126400947571 	 loss mean: 132.57861328125
nll mean: 132.46214294433594 	 kl mean: 0.06534126400947571 	 loss mean: 132.52748107910156


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.20it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.16it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.18it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.45001220703125 	 kl mean: 0.06534126400947571 	 loss mean: 132.51535034179688
nll mean: 132.41397094726562 	 kl mean: 0.06534126400947571 	 loss mean: 132.47930908203125
nll mean: 132.36068725585938 	 kl mean: 0.06534126400947571 	 loss mean: 132.42604064941406
nll mean: 104.5183334350586 	 kl mean: 0.07421138882637024 	 loss mean: 104.59254455566406


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 23.97it/s][A
 60%|██████    | 6/10 [00:00<00:00, 23.59it/s][A

nll mean: 104.52957153320312 	 kl mean: 0.07421138882637024 	 loss mean: 104.6037826538086
nll mean: 104.55663299560547 	 kl mean: 0.07421138882637024 	 loss mean: 104.63084411621094
nll mean: 104.55525970458984 	 kl mean: 0.07421138882637024 	 loss mean: 104.62946319580078
nll mean: 104.56555938720703 	 kl mean: 0.07421138882637024 	 loss mean: 104.63976287841797
nll mean: 104.59276580810547 	 kl mean: 0.07421138882637024 	 loss mean: 104.66697692871094


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.59it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
100%|██████████| 10/10 [00:00<00:00, 22.77it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.54168701171875 	 kl mean: 0.07421138882637024 	 loss mean: 104.61589050292969
nll mean: 104.5361328125 	 kl mean: 0.07421138882637024 	 loss mean: 104.6103515625
nll mean: 104.62356567382812 	 kl mean: 0.07421138882637024 	 loss mean: 104.69778442382812
nll mean: 104.46070861816406 	 kl mean: 0.07421138882637024 	 loss mean: 104.534912109375


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
 10%|█         | 1/10 [00:00<00:00,  9.08it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.56it/s][A

nll mean: 143.5906982421875 	 kl mean: 0.0817456841468811 	 loss mean: 143.67242431640625
nll mean: 143.69366455078125 	 kl mean: 0.0817456841468811 	 loss mean: 143.77542114257812
nll mean: 143.7548828125 	 kl mean: 0.0817456841468811 	 loss mean: 143.83663940429688


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 30%|███       | 3/10 [00:00<00:00,  9.56it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.08it/s][A

nll mean: 143.73297119140625 	 kl mean: 0.0817456841468811 	 loss mean: 143.81472778320312
nll mean: 143.72726440429688 	 kl mean: 0.0817456841468811 	 loss mean: 143.80902099609375
nll mean: 143.68682861328125 	 kl mean: 0.0817456841468811 	 loss mean: 143.76858520507812


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.08it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.38it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.52it/s][A

nll mean: 143.59228515625 	 kl mean: 0.0817456841468811 	 loss mean: 143.6740264892578
nll mean: 143.60263061523438 	 kl mean: 0.0817456841468811 	 loss mean: 143.6843719482422
nll mean: 143.66082763671875 	 kl mean: 0.0817456841468811 	 loss mean: 143.74256896972656


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
100%|██████████| 10/10 [00:00<00:00, 10.83it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.71it/s][A

nll mean: 143.79425048828125 	 kl mean: 0.0817456841468811 	 loss mean: 143.87600708007812
nll mean: 130.7198486328125 	 kl mean: 0.06832308322191238 	 loss mean: 130.78817749023438
nll mean: 130.6829833984375 	 kl mean: 0.06832308322191238 	 loss mean: 130.75131225585938


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.71it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.58it/s][A

nll mean: 130.75665283203125 	 kl mean: 0.06832308322191238 	 loss mean: 130.82498168945312
nll mean: 130.8424072265625 	 kl mean: 0.06832308322191238 	 loss mean: 130.91073608398438
nll mean: 130.78176879882812 	 kl mean: 0.06832308322191238 	 loss mean: 130.85009765625


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.58it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.47it/s][A

nll mean: 130.734375 	 kl mean: 0.06832308322191238 	 loss mean: 130.80270385742188
nll mean: 130.75341796875 	 kl mean: 0.06832308322191238 	 loss mean: 130.8217315673828
nll mean: 130.6357421875 	 kl mean: 0.06832308322191238 	 loss mean: 130.70407104492188


                                              
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.38it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.82870483398438 	 kl mean: 0.06832308322191238 	 loss mean: 130.89703369140625
nll mean: 130.7286834716797 	 kl mean: 0.06832308322191238 	 loss mean: 130.7969970703125
nll mean: 128.71249389648438 	 kl mean: 0.06707435846328735 	 loss mean: 128.77957153320312


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 15.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.33it/s][A

nll mean: 128.78260803222656 	 kl mean: 0.06707435846328735 	 loss mean: 128.84967041015625
nll mean: 128.73196411132812 	 kl mean: 0.06707435846328735 	 loss mean: 128.79904174804688
nll mean: 128.76199340820312 	 kl mean: 0.06707435846328735 	 loss mean: 128.82907104492188


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 15.33it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.88it/s][A

nll mean: 128.75143432617188 	 kl mean: 0.06707435846328735 	 loss mean: 128.81851196289062
nll mean: 128.7088623046875 	 kl mean: 0.06707435846328735 	 loss mean: 128.77593994140625
nll mean: 128.7191925048828 	 kl mean: 0.06707435846328735 	 loss mean: 128.78627014160156


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.88it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.49it/s][A
 16%|█▌        | 6/38 [00:03<00:20,  1.53it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.7275390625 	 kl mean: 0.06707435846328735 	 loss mean: 128.79461669921875
nll mean: 128.68910217285156 	 kl mean: 0.06707435846328735 	 loss mean: 128.75616455078125
nll mean: 128.65338134765625 	 kl mean: 0.06707435846328735 	 loss mean: 128.720458984375
nll mean: 137.67672729492188 	 kl mean: 0.06278623640537262 	 loss mean: 137.73951721191406


                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.53it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 25.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.37it/s][A

nll mean: 137.66165161132812 	 kl mean: 0.06278623640537262 	 loss mean: 137.72442626953125
nll mean: 137.7346649169922 	 kl mean: 0.06278623640537262 	 loss mean: 137.79745483398438
nll mean: 137.7243194580078 	 kl mean: 0.06278623640537262 	 loss mean: 137.787109375
nll mean: 137.77401733398438 	 kl mean: 0.06278623640537262 	 loss mean: 137.83680725097656
nll mean: 137.609130859375 	 kl mean: 0.06278623640537262 	 loss mean: 137.67193603515625


                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.37it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:20,  1.53it/s]
100%|██████████| 10/10 [00:00<00:00, 25.00it/s][A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.7611083984375 	 kl mean: 0.06278623640537262 	 loss mean: 137.82388305664062
nll mean: 137.71563720703125 	 kl mean: 0.06278623640537262 	 loss mean: 137.77841186523438
nll mean: 137.7673797607422 	 kl mean: 0.06278623640537262 	 loss mean: 137.83016967773438
nll mean: 137.7119598388672 	 kl mean: 0.06278623640537262 	 loss mean: 137.77474975585938
nll mean: 110.9185562133789 	 kl mean: 0.06991507112979889 	 loss mean: 110.98847961425781


                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 25.15it/s][A
                                              [A

nll mean: 110.97637176513672 	 kl mean: 0.06991507112979889 	 loss mean: 111.04629516601562
nll mean: 110.97408294677734 	 kl mean: 0.06991507112979889 	 loss mean: 111.04399871826172
nll mean: 110.98982238769531 	 kl mean: 0.06991507112979889 	 loss mean: 111.05973815917969
nll mean: 110.999267578125 	 kl mean: 0.06991507112979889 	 loss mean: 111.06918334960938
nll mean: 110.99639892578125 	 kl mean: 0.06991507112979889 	 loss mean: 111.06631469726562



 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.07it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:17,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 24.91it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.9459457397461 	 kl mean: 0.06991507112979889 	 loss mean: 111.01586151123047
nll mean: 110.9976806640625 	 kl mean: 0.06991507112979889 	 loss mean: 111.06759643554688
nll mean: 110.98138427734375 	 kl mean: 0.06991507112979889 	 loss mean: 111.05130004882812
nll mean: 110.97662353515625 	 kl mean: 0.06991507112979889 	 loss mean: 111.04653930664062
nll mean: 137.75804138183594 	 kl mean: 0.06461641192436218 	 loss mean: 137.82266235351562


                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A

nll mean: 137.85035705566406 	 kl mean: 0.06461641192436218 	 loss mean: 137.9149627685547
nll mean: 137.66412353515625 	 kl mean: 0.06461641192436218 	 loss mean: 137.72872924804688
nll mean: 137.67904663085938 	 kl mean: 0.06461641192436218 	 loss mean: 137.74365234375
nll mean: 137.74810791015625 	 kl mean: 0.06461641192436218 	 loss mean: 137.81271362304688


                                              
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.97it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.18it/s][A

nll mean: 137.71450805664062 	 kl mean: 0.06461641192436218 	 loss mean: 137.77911376953125
nll mean: 137.86509704589844 	 kl mean: 0.06461641192436218 	 loss mean: 137.92971801757812
nll mean: 137.75906372070312 	 kl mean: 0.06461641192436218 	 loss mean: 137.8236846923828
nll mean: 137.63818359375 	 kl mean: 0.06461641192436218 	 loss mean: 137.7028045654297


                                              
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.18it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.41it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 22.38it/s][A

nll mean: 137.73504638671875 	 kl mean: 0.06461641192436218 	 loss mean: 137.79965209960938
nll mean: 137.48507690429688 	 kl mean: 0.06272654980421066 	 loss mean: 137.5478057861328
nll mean: 137.55661010742188 	 kl mean: 0.06272654980421066 	 loss mean: 137.61932373046875
nll mean: 137.51046752929688 	 kl mean: 0.06272654980421066 	 loss mean: 137.57318115234375
nll mean: 137.56085205078125 	 kl mean: 0.06272654980421066 	 loss mean: 137.62356567382812


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 22.38it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.11it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.97it/s][A

nll mean: 137.6197052001953 	 kl mean: 0.06272654980421066 	 loss mean: 137.68243408203125
nll mean: 137.5399169921875 	 kl mean: 0.06272654980421066 	 loss mean: 137.60264587402344
nll mean: 137.53663635253906 	 kl mean: 0.06272654980421066 	 loss mean: 137.599365234375
nll mean: 137.53387451171875 	 kl mean: 0.06272654980421066 	 loss mean: 137.59658813476562
nll mean: 137.56573486328125 	 kl mean: 0.06272654980421066 	 loss mean: 137.62844848632812


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
100%|██████████| 10/10 [00:00<00:00, 21.82it/s][A
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
 30%|███       | 3/10 [00:00<00:00, 25.00it/s][A

nll mean: 137.5858612060547 	 kl mean: 0.06272654980421066 	 loss mean: 137.64859008789062
nll mean: 124.11647033691406 	 kl mean: 0.06025665998458862 	 loss mean: 124.17672729492188
nll mean: 124.13252258300781 	 kl mean: 0.06025665998458862 	 loss mean: 124.19277954101562
nll mean: 124.14842987060547 	 kl mean: 0.06025665998458862 	 loss mean: 124.20868682861328
nll mean: 124.0612564086914 	 kl mean: 0.06025665998458862 	 loss mean: 124.12150573730469


                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.88it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s]
 30%|███       | 3/10 [00:00<00:00, 25.00it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.79it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.62it/s][A

nll mean: 124.13729858398438 	 kl mean: 0.06025665998458862 	 loss mean: 124.19754791259766
nll mean: 124.18023681640625 	 kl mean: 0.06025665998458862 	 loss mean: 124.2405014038086
nll mean: 124.23651123046875 	 kl mean: 0.06025665998458862 	 loss mean: 124.2967758178711
nll mean: 124.14450073242188 	 kl mean: 0.06025665998458862 	 loss mean: 124.20475769042969
nll mean: 124.23180389404297 	 kl mean: 0.06025665998458862 	 loss mean: 124.29206085205078


                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.88it/s]
100%|██████████| 10/10 [00:00<00:00, 24.46it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 21.96it/s][A

nll mean: 124.08909606933594 	 kl mean: 0.06025665998458862 	 loss mean: 124.14934539794922
nll mean: 147.4423828125 	 kl mean: 0.0646090880036354 	 loss mean: 147.5070037841797
nll mean: 147.4205780029297 	 kl mean: 0.0646090880036354 	 loss mean: 147.48519897460938
nll mean: 147.27684020996094 	 kl mean: 0.0646090880036354 	 loss mean: 147.34144592285156
nll mean: 147.34243774414062 	 kl mean: 0.0646090880036354 	 loss mean: 147.4070587158203


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 21.96it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.41it/s][A

nll mean: 147.35617065429688 	 kl mean: 0.0646090880036354 	 loss mean: 147.4207763671875
nll mean: 147.30384826660156 	 kl mean: 0.0646090880036354 	 loss mean: 147.3684539794922
nll mean: 147.31793212890625 	 kl mean: 0.0646090880036354 	 loss mean: 147.38253784179688
nll mean: 147.2677764892578 	 kl mean: 0.0646090880036354 	 loss mean: 147.33238220214844
nll mean: 147.30313110351562 	 kl mean: 0.0646090880036354 	 loss mean: 147.36773681640625


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.02it/s]
100%|██████████| 10/10 [00:00<00:00, 21.26it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A

nll mean: 147.32461547851562 	 kl mean: 0.0646090880036354 	 loss mean: 147.38922119140625
nll mean: 123.89619445800781 	 kl mean: 0.06286722421646118 	 loss mean: 123.95906066894531
nll mean: 123.83381652832031 	 kl mean: 0.06286722421646118 	 loss mean: 123.89668273925781


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
 40%|████      | 4/10 [00:00<00:00, 12.67it/s][A

nll mean: 123.89946746826172 	 kl mean: 0.06286722421646118 	 loss mean: 123.96234130859375
nll mean: 123.87144470214844 	 kl mean: 0.06286722421646118 	 loss mean: 123.93431091308594
nll mean: 123.9591293334961 	 kl mean: 0.06286722421646118 	 loss mean: 124.0219955444336


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
 40%|████      | 4/10 [00:00<00:00, 12.67it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.58it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A

nll mean: 123.97117614746094 	 kl mean: 0.06286722421646118 	 loss mean: 124.03404235839844
nll mean: 123.90400695800781 	 kl mean: 0.06286722421646118 	 loss mean: 123.96687316894531
nll mean: 123.83208465576172 	 kl mean: 0.06286722421646118 	 loss mean: 123.89495086669922


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.49it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.93785858154297 	 kl mean: 0.06286722421646118 	 loss mean: 124.00071716308594
nll mean: 123.90412139892578 	 kl mean: 0.06286722421646118 	 loss mean: 123.96699523925781
nll mean: 166.0758819580078 	 kl mean: 0.06920356303453445 	 loss mean: 166.14508056640625


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 10.02it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.94it/s][A

nll mean: 166.08599853515625 	 kl mean: 0.06920356303453445 	 loss mean: 166.15521240234375
nll mean: 166.0648956298828 	 kl mean: 0.06920356303453445 	 loss mean: 166.13409423828125


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00,  9.94it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]

nll mean: 166.17428588867188 	 kl mean: 0.06920356303453445 	 loss mean: 166.24346923828125
nll mean: 166.01498413085938 	 kl mean: 0.06920356303453445 	 loss mean: 166.08419799804688
nll mean: 166.18533325195312 	 kl mean: 0.06920356303453445 	 loss mean: 166.25453186035156



 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.92it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.92it/s][A

nll mean: 166.13381958007812 	 kl mean: 0.06920356303453445 	 loss mean: 166.20303344726562
nll mean: 166.16262817382812 	 kl mean: 0.06920356303453445 	 loss mean: 166.23184204101562


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.92it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.90it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 166.0655517578125 	 kl mean: 0.06920356303453445 	 loss mean: 166.134765625
nll mean: 166.19400024414062 	 kl mean: 0.06920356303453445 	 loss mean: 166.26321411132812
nll mean: 139.49034118652344 	 kl mean: 0.07271147519350052 	 loss mean: 139.56304931640625


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.61it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.35it/s][A

nll mean: 139.48834228515625 	 kl mean: 0.07271147519350052 	 loss mean: 139.56105041503906
nll mean: 139.43606567382812 	 kl mean: 0.07271147519350052 	 loss mean: 139.5087890625
nll mean: 139.5142364501953 	 kl mean: 0.07271147519350052 	 loss mean: 139.58694458007812
nll mean: 139.4258270263672 	 kl mean: 0.07271147519350052 	 loss mean: 139.49855041503906


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.35it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.32it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.20it/s][A

nll mean: 139.51925659179688 	 kl mean: 0.07271147519350052 	 loss mean: 139.5919647216797
nll mean: 139.4827117919922 	 kl mean: 0.07271147519350052 	 loss mean: 139.555419921875
nll mean: 139.55404663085938 	 kl mean: 0.07271147519350052 	 loss mean: 139.6267547607422
nll mean: 139.43569946289062 	 kl mean: 0.07271147519350052 	 loss mean: 139.50839233398438


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.20it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.04it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.72it/s][A

nll mean: 139.47708129882812 	 kl mean: 0.07271147519350052 	 loss mean: 139.5498046875
nll mean: 149.18092346191406 	 kl mean: 0.06946054100990295 	 loss mean: 149.25039672851562
nll mean: 149.216796875 	 kl mean: 0.06946054100990295 	 loss mean: 149.2862548828125


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.72it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A

nll mean: 149.23245239257812 	 kl mean: 0.06946054100990295 	 loss mean: 149.30191040039062
nll mean: 149.29104614257812 	 kl mean: 0.06946054100990295 	 loss mean: 149.36050415039062
nll mean: 149.23150634765625 	 kl mean: 0.06946054100990295 	 loss mean: 149.30096435546875


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.72it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.75it/s][A

nll mean: 149.09701538085938 	 kl mean: 0.06946054100990295 	 loss mean: 149.16647338867188
nll mean: 149.2017364501953 	 kl mean: 0.06946054100990295 	 loss mean: 149.27120971679688
nll mean: 149.14710998535156 	 kl mean: 0.06946054100990295 	 loss mean: 149.21658325195312


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.75it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.75it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 149.23611450195312 	 kl mean: 0.06946054100990295 	 loss mean: 149.3055877685547
nll mean: 149.13877868652344 	 kl mean: 0.06946054100990295 	 loss mean: 149.20822143554688
nll mean: 148.428466796875 	 kl mean: 0.07599835097789764 	 loss mean: 148.50448608398438
nll mean: 148.49932861328125 	 kl mean: 0.07599835097789764 	 loss mean: 148.57534790039062


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 25.00it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.92it/s][A

nll mean: 148.553955078125 	 kl mean: 0.07599835097789764 	 loss mean: 148.62994384765625
nll mean: 148.50643920898438 	 kl mean: 0.07599835097789764 	 loss mean: 148.5824432373047
nll mean: 148.54586791992188 	 kl mean: 0.07599835097789764 	 loss mean: 148.6218719482422
nll mean: 148.5349884033203 	 kl mean: 0.07599835097789764 	 loss mean: 148.61099243164062
nll mean: 148.4622802734375 	 kl mean: 0.07599835097789764 	 loss mean: 148.5382843017578


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.92it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
100%|██████████| 10/10 [00:00<00:00, 24.72it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 148.6034698486328 	 kl mean: 0.07599835097789764 	 loss mean: 148.67947387695312
nll mean: 148.52847290039062 	 kl mean: 0.07599835097789764 	 loss mean: 148.60447692871094
nll mean: 148.47579956054688 	 kl mean: 0.07599835097789764 	 loss mean: 148.55178833007812
nll mean: 138.4619140625 	 kl mean: 0.0627480149269104 	 loss mean: 138.524658203125
nll mean: 138.40008544921875 	 kl mean: 0.0627480149269104 	 loss mean: 138.4628448486328


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.40it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.30it/s]

nll mean: 138.25323486328125 	 kl mean: 0.0627480149269104 	 loss mean: 138.31597900390625
nll mean: 138.311279296875 	 kl mean: 0.0627480149269104 	 loss mean: 138.3740234375
nll mean: 138.39181518554688 	 kl mean: 0.0627480149269104 	 loss mean: 138.45455932617188
nll mean: 138.36773681640625 	 kl mean: 0.0627480149269104 	 loss mean: 138.43048095703125
nll mean: 138.33798217773438 	 kl mean: 0.0627480149269104 	 loss mean: 138.40074157714844
nll mean: 138.29681396484375 	 kl mean: 0.0627480149269104 	 loss mean: 138.35955810546875


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.30it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 25.11it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.34072875976562 	 kl mean: 0.0627480149269104 	 loss mean: 138.40347290039062
nll mean: 138.378662109375 	 kl mean: 0.0627480149269104 	 loss mean: 138.44142150878906
nll mean: 136.4761962890625 	 kl mean: 0.06805069744586945 	 loss mean: 136.54425048828125


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.32it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.56it/s][A

nll mean: 136.49014282226562 	 kl mean: 0.06805069744586945 	 loss mean: 136.55819702148438
nll mean: 136.51611328125 	 kl mean: 0.06805069744586945 	 loss mean: 136.58416748046875
nll mean: 136.5689697265625 	 kl mean: 0.06805069744586945 	 loss mean: 136.63699340820312


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 40%|████      | 4/10 [00:00<00:00, 12.56it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A

nll mean: 136.57884216308594 	 kl mean: 0.06805069744586945 	 loss mean: 136.6468963623047
nll mean: 136.5385284423828 	 kl mean: 0.06805069744586945 	 loss mean: 136.60658264160156
nll mean: 136.40066528320312 	 kl mean: 0.06805069744586945 	 loss mean: 136.4687042236328


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.78it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.45816040039062 	 kl mean: 0.06805069744586945 	 loss mean: 136.52621459960938
nll mean: 136.55462646484375 	 kl mean: 0.06805069744586945 	 loss mean: 136.62266540527344
nll mean: 136.5122528076172 	 kl mean: 0.06805069744586945 	 loss mean: 136.58029174804688


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.90it/s][A

nll mean: 154.38397216796875 	 kl mean: 0.0626407265663147 	 loss mean: 154.4466094970703
nll mean: 154.33755493164062 	 kl mean: 0.0626407265663147 	 loss mean: 154.40017700195312
nll mean: 154.3109893798828 	 kl mean: 0.0626407265663147 	 loss mean: 154.37362670898438


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.90it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.86it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.71it/s][A

nll mean: 154.2456817626953 	 kl mean: 0.0626407265663147 	 loss mean: 154.30831909179688
nll mean: 154.29905700683594 	 kl mean: 0.0626407265663147 	 loss mean: 154.3616943359375
nll mean: 154.34686279296875 	 kl mean: 0.0626407265663147 	 loss mean: 154.40951538085938


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.71it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.79it/s][A

nll mean: 154.35568237304688 	 kl mean: 0.0626407265663147 	 loss mean: 154.41830444335938
nll mean: 154.2799835205078 	 kl mean: 0.0626407265663147 	 loss mean: 154.34262084960938
nll mean: 154.26417541503906 	 kl mean: 0.0626407265663147 	 loss mean: 154.32679748535156


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.79it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.74it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.01it/s][A

nll mean: 154.32923889160156 	 kl mean: 0.0626407265663147 	 loss mean: 154.39187622070312
nll mean: 160.82388305664062 	 kl mean: 0.07073189318180084 	 loss mean: 160.89462280273438
nll mean: 160.85073852539062 	 kl mean: 0.07073189318180084 	 loss mean: 160.92147827148438


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.01it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 12.81it/s][A

nll mean: 160.81039428710938 	 kl mean: 0.07073189318180084 	 loss mean: 160.88113403320312
nll mean: 160.84799194335938 	 kl mean: 0.07073189318180084 	 loss mean: 160.91871643066406
nll mean: 160.72882080078125 	 kl mean: 0.07073189318180084 	 loss mean: 160.799560546875


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 12.81it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.72it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A

nll mean: 160.81610107421875 	 kl mean: 0.07073189318180084 	 loss mean: 160.88681030273438
nll mean: 160.88870239257812 	 kl mean: 0.07073189318180084 	 loss mean: 160.9594268798828
nll mean: 160.79873657226562 	 kl mean: 0.07073189318180084 	 loss mean: 160.86947631835938


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.47it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 160.7915802001953 	 kl mean: 0.07073189318180084 	 loss mean: 160.8623046875
nll mean: 160.7840576171875 	 kl mean: 0.07073189318180084 	 loss mean: 160.8547821044922
nll mean: 123.51459503173828 	 kl mean: 0.06897640228271484 	 loss mean: 123.58356475830078


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.23it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.24it/s][A

nll mean: 123.54558563232422 	 kl mean: 0.06897640228271484 	 loss mean: 123.61456298828125
nll mean: 123.57647705078125 	 kl mean: 0.06897640228271484 	 loss mean: 123.64545440673828
nll mean: 123.58290100097656 	 kl mean: 0.06897640228271484 	 loss mean: 123.65187072753906


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 10.24it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.25it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.12it/s][A

nll mean: 123.5606460571289 	 kl mean: 0.06897640228271484 	 loss mean: 123.62962341308594
nll mean: 123.50518798828125 	 kl mean: 0.06897640228271484 	 loss mean: 123.57417297363281
nll mean: 123.54521179199219 	 kl mean: 0.06897640228271484 	 loss mean: 123.61418914794922


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.12it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.03it/s][A

nll mean: 123.57684326171875 	 kl mean: 0.06897640228271484 	 loss mean: 123.64581298828125
nll mean: 123.47712707519531 	 kl mean: 0.06897640228271484 	 loss mean: 123.54610443115234
nll mean: 123.66088104248047 	 kl mean: 0.06897640228271484 	 loss mean: 123.72984313964844



100%|██████████| 10/10 [00:00<00:00, 10.12it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 31.92it/s][A

nll mean: 112.17095947265625 	 kl mean: 0.05707752704620361 	 loss mean: 112.22803497314453
nll mean: 112.19266510009766 	 kl mean: 0.05707752704620361 	 loss mean: 112.24974822998047
nll mean: 112.11569213867188 	 kl mean: 0.05707752704620361 	 loss mean: 112.17277526855469
nll mean: 112.12925720214844 	 kl mean: 0.05707752704620361 	 loss mean: 112.18632507324219
nll mean: 112.14373016357422 	 kl mean: 0.05707752704620361 	 loss mean: 112.2008056640625
nll mean: 112.06793212890625 	 kl mean: 0.05707752704620361 	 loss mean: 112.12500762939453
nll mean: 112.25843811035156 	 kl mean: 0.05707752704620361 	 loss mean: 112.31552124023438


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 31.92it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 31.27it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.19194793701172 	 kl mean: 0.05707752704620361 	 loss mean: 112.2490234375
nll mean: 112.05767822265625 	 kl mean: 0.05707752704620361 	 loss mean: 112.11474609375
nll mean: 112.16316223144531 	 kl mean: 0.05707752704620361 	 loss mean: 112.22024536132812
nll mean: 162.57078552246094 	 kl mean: 0.06350196897983551 	 loss mean: 162.63427734375


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.60it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.54it/s][A

nll mean: 162.48245239257812 	 kl mean: 0.06350196897983551 	 loss mean: 162.54595947265625
nll mean: 162.58201599121094 	 kl mean: 0.06350196897983551 	 loss mean: 162.64552307128906
nll mean: 162.5925750732422 	 kl mean: 0.06350196897983551 	 loss mean: 162.65606689453125


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 14.54it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.46it/s][A

nll mean: 162.64846801757812 	 kl mean: 0.06350196897983551 	 loss mean: 162.7119598388672
nll mean: 162.5204620361328 	 kl mean: 0.06350196897983551 	 loss mean: 162.58395385742188
nll mean: 162.58074951171875 	 kl mean: 0.06350196897983551 	 loss mean: 162.64425659179688


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.46it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.41it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.40it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 162.58676147460938 	 kl mean: 0.06350196897983551 	 loss mean: 162.6502685546875
nll mean: 162.6085205078125 	 kl mean: 0.06350196897983551 	 loss mean: 162.67202758789062
nll mean: 162.59234619140625 	 kl mean: 0.06350196897983551 	 loss mean: 162.65585327148438
nll mean: 127.12340545654297 	 kl mean: 0.06775696575641632 	 loss mean: 127.191162109375


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.33it/s][A

nll mean: 127.04842376708984 	 kl mean: 0.06775696575641632 	 loss mean: 127.11617279052734
nll mean: 126.99639892578125 	 kl mean: 0.06775696575641632 	 loss mean: 127.06415557861328
nll mean: 126.93598937988281 	 kl mean: 0.06775696575641632 	 loss mean: 127.00373840332031
nll mean: 127.05216979980469 	 kl mean: 0.06775696575641632 	 loss mean: 127.11993408203125
nll mean: 126.93572235107422 	 kl mean: 0.06775696575641632 	 loss mean: 127.00347900390625


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.33it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 21.04it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.02350616455078 	 kl mean: 0.06775696575641632 	 loss mean: 127.09126281738281
nll mean: 127.1029052734375 	 kl mean: 0.06775696575641632 	 loss mean: 127.170654296875
nll mean: 126.95497131347656 	 kl mean: 0.06775696575641632 	 loss mean: 127.0227279663086
nll mean: 126.9869384765625 	 kl mean: 0.06775696575641632 	 loss mean: 127.05469512939453


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.38it/s][A

nll mean: 120.567138671875 	 kl mean: 0.0602090023458004 	 loss mean: 120.62734985351562
nll mean: 120.58648681640625 	 kl mean: 0.0602090023458004 	 loss mean: 120.64669799804688
nll mean: 120.51354217529297 	 kl mean: 0.0602090023458004 	 loss mean: 120.57374572753906


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.38it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.45it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.45it/s][A

nll mean: 120.50929260253906 	 kl mean: 0.0602090023458004 	 loss mean: 120.56950378417969
nll mean: 120.53204345703125 	 kl mean: 0.0602090023458004 	 loss mean: 120.59225463867188
nll mean: 120.53994750976562 	 kl mean: 0.0602090023458004 	 loss mean: 120.60015106201172


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.45it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.47it/s][A

nll mean: 120.43209075927734 	 kl mean: 0.0602090023458004 	 loss mean: 120.49230194091797
nll mean: 120.45579528808594 	 kl mean: 0.0602090023458004 	 loss mean: 120.5159912109375
nll mean: 120.61206817626953 	 kl mean: 0.0602090023458004 	 loss mean: 120.67227172851562


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.46it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
 30%|███       | 3/10 [00:00<00:00, 23.06it/s][A

nll mean: 120.50177001953125 	 kl mean: 0.0602090023458004 	 loss mean: 120.56196594238281
nll mean: 87.87098693847656 	 kl mean: 0.09564083814620972 	 loss mean: 87.96662902832031
nll mean: 87.72538757324219 	 kl mean: 0.09564083814620972 	 loss mean: 87.82102966308594
nll mean: 87.78868103027344 	 kl mean: 0.09564083814620972 	 loss mean: 87.88432312011719
nll mean: 87.90133666992188 	 kl mean: 0.09564083814620972 	 loss mean: 87.99697875976562


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
 30%|███       | 3/10 [00:00<00:00, 23.06it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.58it/s][A

nll mean: 87.93521118164062 	 kl mean: 0.09564083814620972 	 loss mean: 88.03085327148438
nll mean: 87.80352020263672 	 kl mean: 0.09564083814620972 	 loss mean: 87.89916229248047
nll mean: 87.7906723022461 	 kl mean: 0.09564083814620972 	 loss mean: 87.88631439208984
nll mean: 87.8016357421875 	 kl mean: 0.09564083814620972 	 loss mean: 87.89727783203125
nll mean: 87.86702728271484 	 kl mean: 0.09564083814620972 	 loss mean: 87.9626693725586


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.57it/s]
100%|██████████| 10/10 [00:00<00:00, 22.54it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.90it/s][A

nll mean: 87.91404724121094 	 kl mean: 0.09564083814620972 	 loss mean: 88.00968933105469
nll mean: 113.91343688964844 	 kl mean: 0.058488715440034866 	 loss mean: 113.971923828125
nll mean: 113.89286041259766 	 kl mean: 0.058488715440034866 	 loss mean: 113.95134735107422
nll mean: 113.79945373535156 	 kl mean: 0.058488715440034866 	 loss mean: 113.85794067382812
nll mean: 113.7844467163086 	 kl mean: 0.058488715440034866 	 loss mean: 113.84294128417969


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.90it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.97it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.00it/s][A

nll mean: 113.88227844238281 	 kl mean: 0.058488715440034866 	 loss mean: 113.94076538085938
nll mean: 113.8718032836914 	 kl mean: 0.058488715440034866 	 loss mean: 113.9302978515625
nll mean: 113.86244201660156 	 kl mean: 0.058488715440034866 	 loss mean: 113.92092895507812
nll mean: 113.73135375976562 	 kl mean: 0.058488715440034866 	 loss mean: 113.78984069824219
nll mean: 113.77180480957031 	 kl mean: 0.058488715440034866 	 loss mean: 113.8302993774414


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.99it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.70it/s][A

nll mean: 113.84393310546875 	 kl mean: 0.058488715440034866 	 loss mean: 113.90242767333984
nll mean: 125.50508117675781 	 kl mean: 0.061662234365940094 	 loss mean: 125.56674194335938
nll mean: 125.58370208740234 	 kl mean: 0.061662234365940094 	 loss mean: 125.64535522460938


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.70it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A

nll mean: 125.48196411132812 	 kl mean: 0.061662234365940094 	 loss mean: 125.54362487792969
nll mean: 125.42686462402344 	 kl mean: 0.061662234365940094 	 loss mean: 125.48851776123047
nll mean: 125.51826477050781 	 kl mean: 0.061662234365940094 	 loss mean: 125.5799331665039


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 125.46861267089844 	 kl mean: 0.061662234365940094 	 loss mean: 125.53026580810547
nll mean: 125.43119049072266 	 kl mean: 0.061662234365940094 	 loss mean: 125.49285125732422
nll mean: 125.4608154296875 	 kl mean: 0.061662234365940094 	 loss mean: 125.52247619628906


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.49it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.51840209960938 	 kl mean: 0.061662234365940094 	 loss mean: 125.58007049560547
nll mean: 125.5770263671875 	 kl mean: 0.061662234365940094 	 loss mean: 125.63868713378906
nll mean: 66.48542785644531 	 kl mean: 0.055367447435855865 	 loss mean: 66.54080200195312


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.35it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.31it/s][A

nll mean: 66.46593475341797 	 kl mean: 0.055367447435855865 	 loss mean: 66.52130126953125
nll mean: 66.64744567871094 	 kl mean: 0.055367447435855865 	 loss mean: 66.70280456542969
nll mean: 66.46268463134766 	 kl mean: 0.055367447435855865 	 loss mean: 66.51805114746094


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 10.31it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.26it/s][A

nll mean: 66.43954467773438 	 kl mean: 0.055367447435855865 	 loss mean: 66.49491882324219
nll mean: 66.55937957763672 	 kl mean: 0.055367447435855865 	 loss mean: 66.61474609375
nll mean: 66.57093048095703 	 kl mean: 0.055367447435855865 	 loss mean: 66.62629699707031


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.26it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.26it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.25it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 66.50375366210938 	 kl mean: 0.055367447435855865 	 loss mean: 66.55912017822266
nll mean: 66.51258850097656 	 kl mean: 0.055367447435855865 	 loss mean: 66.56795501708984
nll mean: 66.54597473144531 	 kl mean: 0.055367447435855865 	 loss mean: 66.6013412475586


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A

nll mean: 109.84574890136719 	 kl mean: 0.0717490091919899 	 loss mean: 109.91749572753906
nll mean: 109.9456787109375 	 kl mean: 0.0717490091919899 	 loss mean: 110.01741790771484
nll mean: 109.93623352050781 	 kl mean: 0.0717490091919899 	 loss mean: 110.00798034667969


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.80it/s][A

nll mean: 109.963134765625 	 kl mean: 0.0717490091919899 	 loss mean: 110.03488159179688
nll mean: 109.89614868164062 	 kl mean: 0.0717490091919899 	 loss mean: 109.96790313720703
nll mean: 109.85579681396484 	 kl mean: 0.0717490091919899 	 loss mean: 109.92755126953125


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.80it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.85it/s][A

nll mean: 109.80250549316406 	 kl mean: 0.0717490091919899 	 loss mean: 109.874267578125
nll mean: 109.95008850097656 	 kl mean: 0.0717490091919899 	 loss mean: 110.02184295654297
nll mean: 109.88313293457031 	 kl mean: 0.0717490091919899 	 loss mean: 109.95487976074219


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.85it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.99it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.78449249267578 	 kl mean: 0.0717490091919899 	 loss mean: 109.85623931884766
nll mean: 143.9337158203125 	 kl mean: 0.07611703127622604 	 loss mean: 144.00982666015625
nll mean: 144.06460571289062 	 kl mean: 0.07611703127622604 	 loss mean: 144.14071655273438



                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 10.22it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 10.12it/s][A
                                               [A

nll mean: 143.89501953125 	 kl mean: 0.07611703127622604 	 loss mean: 143.97113037109375
nll mean: 143.9292755126953 	 kl mean: 0.07611703127622604 	 loss mean: 144.00540161132812



 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 10.06it/s][A
                                               [A
[A                                           

nll mean: 143.98190307617188 	 kl mean: 0.07611703127622604 	 loss mean: 144.05801391601562
nll mean: 143.8691864013672 	 kl mean: 0.07611703127622604 	 loss mean: 143.9453125


 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.05it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.99it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.04it/s][A

nll mean: 143.96505737304688 	 kl mean: 0.07611703127622604 	 loss mean: 144.04116821289062
nll mean: 143.84420776367188 	 kl mean: 0.07611703127622604 	 loss mean: 143.9203338623047
nll mean: 143.91238403320312 	 kl mean: 0.07611703127622604 	 loss mean: 143.98849487304688


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s]
100%|██████████| 10/10 [00:00<00:00, 10.06it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.14it/s][A

nll mean: 143.9786834716797 	 kl mean: 0.07611703127622604 	 loss mean: 144.0548095703125
nll mean: 68.56999206542969 	 kl mean: 0.055219605565071106 	 loss mean: 68.62521362304688
nll mean: 68.65315246582031 	 kl mean: 0.055219605565071106 	 loss mean: 68.70835876464844
nll mean: 68.606689453125 	 kl mean: 0.055219605565071106 	 loss mean: 68.66191101074219
nll mean: 68.56243896484375 	 kl mean: 0.055219605565071106 	 loss mean: 68.61766052246094
nll mean: 68.54347229003906 	 kl mean: 0.055219605565071106 	 loss mean: 68.59869384765625


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.14it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.99it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
100%|██████████| 10/10 [00:00<00:00, 25.80it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 68.61306762695312 	 kl mean: 0.055219605565071106 	 loss mean: 68.66828155517578
nll mean: 68.613525390625 	 kl mean: 0.055219605565071106 	 loss mean: 68.66873931884766
nll mean: 68.593994140625 	 kl mean: 0.055219605565071106 	 loss mean: 68.64921569824219
nll mean: 68.56687927246094 	 kl mean: 0.055219605565071106 	 loss mean: 68.62210083007812
nll mean: 68.59556579589844 	 kl mean: 0.055219605565071106 	 loss mean: 68.65078735351562


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
 30%|███       | 3/10 [00:00<00:00, 21.94it/s][A

nll mean: 123.74195861816406 	 kl mean: 0.06819051504135132 	 loss mean: 123.81015014648438
nll mean: 123.65774536132812 	 kl mean: 0.06819051504135132 	 loss mean: 123.7259292602539
nll mean: 123.6173324584961 	 kl mean: 0.06819051504135132 	 loss mean: 123.68551635742188
nll mean: 123.62171936035156 	 kl mean: 0.06819051504135132 	 loss mean: 123.68991088867188
nll mean: 123.65384674072266 	 kl mean: 0.06819051504135132 	 loss mean: 123.72203063964844


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
 30%|███       | 3/10 [00:00<00:00, 21.94it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.92it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
100%|██████████| 10/10 [00:00<00:00, 21.87it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 123.63373565673828 	 kl mean: 0.06819051504135132 	 loss mean: 123.70191955566406
nll mean: 123.6890869140625 	 kl mean: 0.06819051504135132 	 loss mean: 123.75727844238281
nll mean: 123.57038879394531 	 kl mean: 0.06819051504135132 	 loss mean: 123.63858032226562
nll mean: 123.59854888916016 	 kl mean: 0.06819051504135132 	 loss mean: 123.666748046875
nll mean: 123.66431427001953 	 kl mean: 0.06819051504135132 	 loss mean: 123.73250579833984


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 12.63it/s][A

nll mean: 125.53445434570312 	 kl mean: 0.05916030332446098 	 loss mean: 125.59361267089844
nll mean: 125.52212524414062 	 kl mean: 0.05916030332446098 	 loss mean: 125.58129119873047
nll mean: 125.59938049316406 	 kl mean: 0.05916030332446098 	 loss mean: 125.65853881835938


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 12.63it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.75it/s][A

nll mean: 125.5211181640625 	 kl mean: 0.05916030332446098 	 loss mean: 125.58027648925781
nll mean: 125.56976318359375 	 kl mean: 0.05916030332446098 	 loss mean: 125.62891387939453
nll mean: 125.50094604492188 	 kl mean: 0.05916030332446098 	 loss mean: 125.56011199951172


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.75it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.83it/s][A

nll mean: 125.5457763671875 	 kl mean: 0.05916030332446098 	 loss mean: 125.60493469238281
nll mean: 125.5183334350586 	 kl mean: 0.05916030332446098 	 loss mean: 125.5774917602539
nll mean: 125.56777954101562 	 kl mean: 0.05916030332446098 	 loss mean: 125.62693786621094


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.77it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A

nll mean: 125.62114715576172 	 kl mean: 0.05916030332446098 	 loss mean: 125.6802978515625
nll mean: 118.18119812011719 	 kl mean: 0.07356034219264984 	 loss mean: 118.2547607421875
nll mean: 118.09618377685547 	 kl mean: 0.07356034219264984 	 loss mean: 118.16974639892578


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A

nll mean: 118.05084228515625 	 kl mean: 0.07356034219264984 	 loss mean: 118.12440490722656
nll mean: 118.05699157714844 	 kl mean: 0.07356034219264984 	 loss mean: 118.13055419921875
nll mean: 118.11882019042969 	 kl mean: 0.07356034219264984 	 loss mean: 118.19237518310547


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.69it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.73it/s][A

nll mean: 118.14256286621094 	 kl mean: 0.07356034219264984 	 loss mean: 118.21612548828125
nll mean: 118.20655822753906 	 kl mean: 0.07356034219264984 	 loss mean: 118.2801284790039
nll mean: 118.06926727294922 	 kl mean: 0.07356034219264984 	 loss mean: 118.14283752441406


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.70it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.17830657958984 	 kl mean: 0.07356034219264984 	 loss mean: 118.25187683105469
nll mean: 118.1772689819336 	 kl mean: 0.07356034219264984 	 loss mean: 118.25082397460938
nll mean: 117.79460906982422 	 kl mean: 0.07238086313009262 	 loss mean: 117.86698913574219
nll mean: 117.60517883300781 	 kl mean: 0.07238086313009262 	 loss mean: 117.67755889892578


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 23.32it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.92it/s][A

nll mean: 117.72551727294922 	 kl mean: 0.07238086313009262 	 loss mean: 117.79789733886719
nll mean: 117.68975830078125 	 kl mean: 0.07238086313009262 	 loss mean: 117.76213836669922
nll mean: 117.68260955810547 	 kl mean: 0.07238086313009262 	 loss mean: 117.75498962402344
nll mean: 117.70809936523438 	 kl mean: 0.07238086313009262 	 loss mean: 117.78047943115234
nll mean: 117.75599670410156 	 kl mean: 0.07238086313009262 	 loss mean: 117.82838439941406


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.92it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 22.42it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.64969635009766 	 kl mean: 0.07238086313009262 	 loss mean: 117.72207641601562
nll mean: 117.724609375 	 kl mean: 0.07238086313009262 	 loss mean: 117.79698181152344
nll mean: 117.81430053710938 	 kl mean: 0.07238086313009262 	 loss mean: 117.88667297363281
nll mean: 91.05613708496094 	 kl mean: 0.06083798408508301 	 loss mean: 91.1169662475586
nll mean: 91.0028076171875 	 kl mean: 0.06083798408508301 	 loss mean: 91.06364440917969
nll mean: 91.05101013183594 	 kl mean: 0.06083798408508301 	 loss mean: 91.1118392944336


                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.52it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.52it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.52it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 30.86it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.52it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 30.80it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 91.04331970214844 	 kl mean: 0.06083798408508301 	 loss mean: 91.1041488647461
nll mean: 91.04742431640625 	 kl mean: 0.06083798408508301 	 loss mean: 91.10826873779297
nll mean: 91.03228759765625 	 kl mean: 0.06083798408508301 	 loss mean: 91.09313201904297
nll mean: 91.08650207519531 	 kl mean: 0.06083798408508301 	 loss mean: 91.1473388671875
nll mean: 90.98594665527344 	 kl mean: 0.06083798408508301 	 loss mean: 91.04679870605469
nll mean: 90.9451904296875 	 kl mean: 0.06083798408508301 	 loss mean: 91.00602722167969
nll mean: 91.08644104003906 	 kl mean: 0.06083798408508301 	 loss mean: 91.14727020263672
Approximate NLL:
tensor(126.7274, device='cuda:0')
Approximate KL:
tensor(0.0670, device='cuda:0')
Testing took 0:00:25.120746


In [10]:
# Show the approximate NLL collected for each vanilla checkpoint; the list has
# one entry per saved model file, in the order get_model_filenames returned them.
print(vanilla_nlls)

[tensor(126.9970, device='cuda:0'), tensor(127.1339, device='cuda:0'), tensor(127.0737, device='cuda:0'), tensor(126.7274, device='cuda:0')]


# Word dropout

In [11]:
# Look up one checkpoint per run (results0..results3) for the
# 'word_dropout_066' experiment. This rebinds `saved_model_files`, which
# previously held the vanilla checkpoint paths.
# NOTE(review): get_model_filenames takes the first entry that iterdir() yields
# in each models/ directory, so if a directory holds several checkpoints the
# chosen training step is not guaranteed to match across runs -- confirm.
saved_model_files = get_model_filenames('word_dropout_066')
# Bare last expression: display the resolved paths for inspection.
saved_model_files

['results_final/results0/word_dropout_066/models/sentence_vae_6000.pt',
 'results_final/results1/word_dropout_066/models/sentence_vae_4500.pt',
 'results_final/results2/word_dropout_066/models/sentence_vae_6000.pt',
 'results_final/results3/word_dropout_066/models/sentence_vae_6000.pt']

In [12]:
# Run test_nll_estimation once per word-dropout checkpoint (via get_approx_nlls,
# using the shared `args` dict) and keep the per-checkpoint NLL and KL results
# as two parallel lists.
wd_nlls, wd_kls = get_approx_nlls(saved_model_files)

  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 26.18it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A
                                              

nll mean: 114.40963745117188 	 kl mean: 1.0882575511932373 	 loss mean: 115.49788665771484
nll mean: 114.58032989501953 	 kl mean: 1.0882575511932373 	 loss mean: 115.66859436035156
nll mean: 114.40042114257812 	 kl mean: 1.0882575511932373 	 loss mean: 115.48867797851562
nll mean: 114.36880493164062 	 kl mean: 1.0882575511932373 	 loss mean: 115.45706176757812
nll mean: 114.54505157470703 	 kl mean: 1.0882575511932373 	 loss mean: 115.63330841064453


                                      
  0%|          | 0/38 [00:00<?, ?it/s].18it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.72it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].72it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].72it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].72it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.52it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.23it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 114.48126983642578 	 kl mean: 1.0882575511932373 	 loss mean: 115.56952667236328
nll mean: 114.4964370727539 	 kl mean: 1.0882575511932373 	 loss mean: 115.5846939086914
nll mean: 114.47813415527344 	 kl mean: 1.0882575511932373 	 loss mean: 115.56639099121094
nll mean: 114.47491455078125 	 kl mean: 1.0882575511932373 	 loss mean: 115.56317138671875
nll mean: 114.39823913574219 	 kl mean: 1.0882575511932373 	 loss mean: 115.48649597167969



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 20%|██        | 2/10 [00:00<00:00, 15.06it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A

nll mean: 131.3830108642578 	 kl mean: 1.304136037826538 	 loss mean: 132.68716430664062
nll mean: 131.38198852539062 	 kl mean: 1.304136037826538 	 loss mean: 132.68612670898438
nll mean: 131.39602661132812 	 kl mean: 1.304136037826538 	 loss mean: 132.70016479492188



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.70it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.65it/s][A

nll mean: 131.23602294921875 	 kl mean: 1.304136037826538 	 loss mean: 132.5401611328125
nll mean: 131.487060546875 	 kl mean: 1.304136037826538 	 loss mean: 132.7912139892578
nll mean: 131.226318359375 	 kl mean: 1.304136037826538 	 loss mean: 132.53045654296875



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.43it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s][A

nll mean: 131.28814697265625 	 kl mean: 1.304136037826538 	 loss mean: 132.59225463867188
nll mean: 131.431640625 	 kl mean: 1.304136037826538 	 loss mean: 132.73577880859375
nll mean: 131.44354248046875 	 kl mean: 1.304136037826538 	 loss mean: 132.7476806640625



                                              
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.31it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s]
 30%|███       | 3/10 [00:00<00:00, 25.63it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A


nll mean: 131.2871551513672 	 kl mean: 1.304136037826538 	 loss mean: 132.59127807617188
nll mean: 103.76290893554688 	 kl mean: 1.0861469507217407 	 loss mean: 104.84905242919922
nll mean: 103.88958740234375 	 kl mean: 1.0861469507217407 	 loss mean: 104.97573852539062
nll mean: 103.72383880615234 	 kl mean: 1.0861469507217407 	 loss mean: 104.80998229980469
nll mean: 103.9539566040039 	 kl mean: 1.0861469507217407 	 loss mean: 105.04010009765625


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.23it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.04it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.92it/s][A

nll mean: 103.89437866210938 	 kl mean: 1.0861469507217407 	 loss mean: 104.98052215576172
nll mean: 103.83901977539062 	 kl mean: 1.0861469507217407 	 loss mean: 104.9251708984375
nll mean: 103.6675796508789 	 kl mean: 1.0861469507217407 	 loss mean: 104.75372314453125
nll mean: 103.71833801269531 	 kl mean: 1.0861469507217407 	 loss mean: 104.80448913574219
nll mean: 103.86280059814453 	 kl mean: 1.0861469507217407 	 loss mean: 104.94894409179688



                                              
100%|██████████| 10/10 [00:00<00:00, 24.65it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.92it/s][A

nll mean: 103.67759704589844 	 kl mean: 1.0861469507217407 	 loss mean: 104.76374053955078
nll mean: 143.14703369140625 	 kl mean: 1.2518671751022339 	 loss mean: 144.39891052246094
nll mean: 142.78273010253906 	 kl mean: 1.2518671751022339 	 loss mean: 144.03460693359375


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
 20%|██        | 2/10 [00:00<00:00, 10.92it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
 40%|████      | 4/10 [00:00<00:00, 10.94it/s][A

nll mean: 142.62648010253906 	 kl mean: 1.2518671751022339 	 loss mean: 143.87835693359375
nll mean: 142.77093505859375 	 kl mean: 1.2518671751022339 	 loss mean: 144.02279663085938
nll mean: 142.7499237060547 	 kl mean: 1.2518671751022339 	 loss mean: 144.00180053710938


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 40%|████      | 4/10 [00:00<00:00, 10.94it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.93it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.93it/s][A

nll mean: 142.9202117919922 	 kl mean: 1.2518671751022339 	 loss mean: 144.1720733642578
nll mean: 142.83741760253906 	 kl mean: 1.2518671751022339 	 loss mean: 144.08929443359375
nll mean: 142.99337768554688 	 kl mean: 1.2518671751022339 	 loss mean: 144.2452392578125


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.93it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.92it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]

nll mean: 142.6538848876953 	 kl mean: 1.2518671751022339 	 loss mean: 143.90576171875
nll mean: 143.15667724609375 	 kl mean: 1.2518671751022339 	 loss mean: 144.40855407714844
nll mean: 131.44268798828125 	 kl mean: 1.2193397283554077 	 loss mean: 132.66201782226562



                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.82it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.66it/s][A

nll mean: 131.27586364746094 	 kl mean: 1.2193397283554077 	 loss mean: 132.4951934814453
nll mean: 131.30667114257812 	 kl mean: 1.2193397283554077 	 loss mean: 132.52601623535156
nll mean: 131.30177307128906 	 kl mean: 1.2193397283554077 	 loss mean: 132.5211181640625



                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.55it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A

nll mean: 131.37362670898438 	 kl mean: 1.2193397283554077 	 loss mean: 132.5929718017578
nll mean: 131.42910766601562 	 kl mean: 1.2193397283554077 	 loss mean: 132.64845275878906
nll mean: 131.2240447998047 	 kl mean: 1.2193397283554077 	 loss mean: 132.44338989257812



                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.42it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.66it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.37it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 131.52157592773438 	 kl mean: 1.2193397283554077 	 loss mean: 132.7409210205078
nll mean: 131.25717163085938 	 kl mean: 1.2193397283554077 	 loss mean: 132.47650146484375
nll mean: 131.43231201171875 	 kl mean: 1.2193397283554077 	 loss mean: 132.65164184570312


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 14.75it/s][A

nll mean: 127.72925567626953 	 kl mean: 1.093579888343811 	 loss mean: 128.8228302001953
nll mean: 127.8711166381836 	 kl mean: 1.093579888343811 	 loss mean: 128.96469116210938
nll mean: 127.71295928955078 	 kl mean: 1.093579888343811 	 loss mean: 128.80654907226562


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 14.75it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 14.49it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A

nll mean: 127.71723937988281 	 kl mean: 1.093579888343811 	 loss mean: 128.81082153320312
nll mean: 127.7535400390625 	 kl mean: 1.093579888343811 	 loss mean: 128.84710693359375
nll mean: 127.78907012939453 	 kl mean: 1.093579888343811 	 loss mean: 128.88265991210938
nll mean: 127.6922378540039 	 kl mean: 1.093579888343811 	 loss mean: 128.78582763671875


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.56it/s][A
 16%|█▌        | 6/38 [00:03<00:20,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.54it/s]

nll mean: 127.87342071533203 	 kl mean: 1.093579888343811 	 loss mean: 128.9669952392578
nll mean: 127.75701904296875 	 kl mean: 1.093579888343811 	 loss mean: 128.8505859375
nll mean: 127.70246887207031 	 kl mean: 1.093579888343811 	 loss mean: 128.79605102539062
nll mean: 139.43751525878906 	 kl mean: 1.0838031768798828 	 loss mean: 140.52130126953125



                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.54it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 25.69it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:20,  1.54it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.54it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.43it/s][A


nll mean: 139.36264038085938 	 kl mean: 1.0838031768798828 	 loss mean: 140.44644165039062
nll mean: 139.34237670898438 	 kl mean: 1.0838031768798828 	 loss mean: 140.4261932373047
nll mean: 139.51852416992188 	 kl mean: 1.0838031768798828 	 loss mean: 140.60232543945312
nll mean: 139.37229919433594 	 kl mean: 1.0838031768798828 	 loss mean: 140.45611572265625
nll mean: 139.411865234375 	 kl mean: 1.0838031768798828 	 loss mean: 140.49566650390625


                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.54it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.54it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:20,  1.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.21it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.99it/s][A
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s]

nll mean: 139.32308959960938 	 kl mean: 1.0838031768798828 	 loss mean: 140.40689086914062
nll mean: 139.27615356445312 	 kl mean: 1.0838031768798828 	 loss mean: 140.35995483398438
nll mean: 139.26409912109375 	 kl mean: 1.0838031768798828 	 loss mean: 140.34793090820312
nll mean: 139.28634643554688 	 kl mean: 1.0838031768798828 	 loss mean: 140.37014770507812
nll mean: 111.569091796875 	 kl mean: 1.2248655557632446 	 loss mean: 112.79396057128906



                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 25.14it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.08it/s][A
[A                                           

nll mean: 111.13964080810547 	 kl mean: 1.2248655557632446 	 loss mean: 112.364501953125
nll mean: 111.26824188232422 	 kl mean: 1.2248655557632446 	 loss mean: 112.49310302734375
nll mean: 111.42778778076172 	 kl mean: 1.2248655557632446 	 loss mean: 112.65264892578125
nll mean: 111.22286987304688 	 kl mean: 1.2248655557632446 	 loss mean: 112.44773864746094
nll mean: 111.32215881347656 	 kl mean: 1.2248655557632446 	 loss mean: 112.54702758789062


                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:17,  1.74it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.00it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.85it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.23918914794922 	 kl mean: 1.2248655557632446 	 loss mean: 112.46405792236328
nll mean: 111.46408081054688 	 kl mean: 1.2248655557632446 	 loss mean: 112.68894958496094
nll mean: 111.19638061523438 	 kl mean: 1.2248655557632446 	 loss mean: 112.42124938964844
nll mean: 111.35649108886719 	 kl mean: 1.2248655557632446 	 loss mean: 112.58135986328125
nll mean: 136.5780487060547 	 kl mean: 1.2087877988815308 	 loss mean: 137.78683471679688


                                              
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
 20%|██        | 2/10 [00:00<00:00, 14.53it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.91it/s]
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A

nll mean: 136.66702270507812 	 kl mean: 1.2087877988815308 	 loss mean: 137.87579345703125
nll mean: 136.63345336914062 	 kl mean: 1.2087877988815308 	 loss mean: 137.84225463867188
nll mean: 136.79806518554688 	 kl mean: 1.2087877988815308 	 loss mean: 138.00686645507812
nll mean: 136.94175720214844 	 kl mean: 1.2087877988815308 	 loss mean: 138.15054321289062


                                              
 21%|██        | 8/38 [00:05<00:15,  1.91it/s]
 40%|████      | 4/10 [00:00<00:00, 14.99it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.91it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.91it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.87it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.91it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.16it/s][A

nll mean: 136.99026489257812 	 kl mean: 1.2087877988815308 	 loss mean: 138.1990509033203
nll mean: 136.8055419921875 	 kl mean: 1.2087877988815308 	 loss mean: 138.01431274414062
nll mean: 136.64486694335938 	 kl mean: 1.2087877988815308 	 loss mean: 137.8536376953125
nll mean: 136.7222442626953 	 kl mean: 1.2087877988815308 	 loss mean: 137.9310302734375


                                              
 21%|██        | 8/38 [00:05<00:15,  1.91it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.16it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.18it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s]
 30%|███       | 3/10 [00:00<00:00, 22.17it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A

nll mean: 136.64395141601562 	 kl mean: 1.2087877988815308 	 loss mean: 137.85272216796875
nll mean: 135.98361206054688 	 kl mean: 1.030126690864563 	 loss mean: 137.01373291015625
nll mean: 135.4679718017578 	 kl mean: 1.030126690864563 	 loss mean: 136.4980926513672
nll mean: 135.54449462890625 	 kl mean: 1.030126690864563 	 loss mean: 136.57461547851562
nll mean: 135.6444091796875 	 kl mean: 1.030126690864563 	 loss mean: 136.67453002929688



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.98it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.88it/s][A

nll mean: 135.7550048828125 	 kl mean: 1.030126690864563 	 loss mean: 136.78512573242188
nll mean: 135.6230010986328 	 kl mean: 1.030126690864563 	 loss mean: 136.65313720703125
nll mean: 135.8001708984375 	 kl mean: 1.030126690864563 	 loss mean: 136.83030700683594
nll mean: 135.59495544433594 	 kl mean: 1.030126690864563 	 loss mean: 136.62506103515625
nll mean: 135.80018615722656 	 kl mean: 1.030126690864563 	 loss mean: 136.830322265625



                                              
100%|██████████| 10/10 [00:00<00:00, 21.68it/s][A
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s]
 30%|███       | 3/10 [00:00<00:00, 24.90it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s][A

nll mean: 135.59719848632812 	 kl mean: 1.030126690864563 	 loss mean: 136.6273193359375
nll mean: 123.0098876953125 	 kl mean: 1.3766661882400513 	 loss mean: 124.38655853271484
nll mean: 123.00242614746094 	 kl mean: 1.3766661882400513 	 loss mean: 124.37909698486328
nll mean: 122.99150085449219 	 kl mean: 1.3766661882400513 	 loss mean: 124.3681640625
nll mean: 122.83134460449219 	 kl mean: 1.3766661882400513 	 loss mean: 124.20801544189453



                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:14,  1.87it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.87it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.87it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:14,  1.87it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.65it/s][A

nll mean: 123.06468200683594 	 kl mean: 1.3766661882400513 	 loss mean: 124.44135284423828
nll mean: 123.06541442871094 	 kl mean: 1.3766661882400513 	 loss mean: 124.44207763671875
nll mean: 122.87528991699219 	 kl mean: 1.3766661882400513 	 loss mean: 124.25196075439453
nll mean: 123.04447937011719 	 kl mean: 1.3766661882400513 	 loss mean: 124.42115783691406
nll mean: 123.02676391601562 	 kl mean: 1.3766661882400513 	 loss mean: 124.40342712402344



                                               
100%|██████████| 10/10 [00:00<00:00, 24.49it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 21.42it/s][A

nll mean: 123.03396606445312 	 kl mean: 1.3766661882400513 	 loss mean: 124.41064453125
nll mean: 146.44436645507812 	 kl mean: 1.2105891704559326 	 loss mean: 147.65493774414062
nll mean: 146.2667236328125 	 kl mean: 1.2105891704559326 	 loss mean: 147.477294921875
nll mean: 146.66384887695312 	 kl mean: 1.2105891704559326 	 loss mean: 147.8744354248047
nll mean: 146.3349609375 	 kl mean: 1.2105891704559326 	 loss mean: 147.54554748535156


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 21.42it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.32it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.53it/s][A

nll mean: 146.43675231933594 	 kl mean: 1.2105891704559326 	 loss mean: 147.6473388671875
nll mean: 146.58148193359375 	 kl mean: 1.2105891704559326 	 loss mean: 147.7920684814453
nll mean: 146.31936645507812 	 kl mean: 1.2105891704559326 	 loss mean: 147.52996826171875
nll mean: 146.35252380371094 	 kl mean: 1.2105891704559326 	 loss mean: 147.5631103515625
nll mean: 146.38162231445312 	 kl mean: 1.2105891704559326 	 loss mean: 147.59222412109375


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 21.49it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.05it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.05it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.05it/s]
 20%|██        | 2/10 [00:00<00:00, 12.41it/s][A

nll mean: 146.369873046875 	 kl mean: 1.2105891704559326 	 loss mean: 147.5804443359375
nll mean: 123.94513702392578 	 kl mean: 1.4619293212890625 	 loss mean: 125.40706634521484
nll mean: 124.19169616699219 	 kl mean: 1.4619293212890625 	 loss mean: 125.65362548828125



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.05it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.05it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A

nll mean: 124.03912353515625 	 kl mean: 1.4619293212890625 	 loss mean: 125.50104522705078
nll mean: 124.01551818847656 	 kl mean: 1.4619293212890625 	 loss mean: 125.47743225097656
nll mean: 124.14663696289062 	 kl mean: 1.4619293212890625 	 loss mean: 125.60856628417969



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.56it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A

nll mean: 123.94912719726562 	 kl mean: 1.4619293212890625 	 loss mean: 125.41104888916016
nll mean: 124.08523559570312 	 kl mean: 1.4619293212890625 	 loss mean: 125.54716491699219
nll mean: 123.97655487060547 	 kl mean: 1.4619293212890625 	 loss mean: 125.43849182128906



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.05it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.64it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]

nll mean: 123.77487182617188 	 kl mean: 1.4619293212890625 	 loss mean: 125.23680114746094
nll mean: 123.91718292236328 	 kl mean: 1.4619293212890625 	 loss mean: 125.37911224365234
nll mean: 167.54615783691406 	 kl mean: 1.3721503019332886 	 loss mean: 168.91830444335938



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]
 20%|██        | 2/10 [00:00<00:00, 10.10it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.03it/s][A
[A                                           

nll mean: 167.539306640625 	 kl mean: 1.3721503019332886 	 loss mean: 168.91146850585938
nll mean: 167.45127868652344 	 kl mean: 1.3721503019332886 	 loss mean: 168.82342529296875


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.03it/s][A
                                               

nll mean: 167.83590698242188 	 kl mean: 1.3721503019332886 	 loss mean: 169.20803833007812
nll mean: 167.5209503173828 	 kl mean: 1.3721503019332886 	 loss mean: 168.89309692382812



 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.98it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.99it/s][A

nll mean: 167.62319946289062 	 kl mean: 1.3721503019332886 	 loss mean: 168.995361328125
nll mean: 167.7342529296875 	 kl mean: 1.3721503019332886 	 loss mean: 169.10638427734375



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.89it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A

nll mean: 167.55850219726562 	 kl mean: 1.3721503019332886 	 loss mean: 168.93064880371094
nll mean: 167.64234924316406 	 kl mean: 1.3721503019332886 	 loss mean: 169.01449584960938
nll mean: 167.69146728515625 	 kl mean: 1.3721503019332886 	 loss mean: 169.06361389160156



100%|██████████| 10/10 [00:01<00:00,  9.97it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.31it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.19it/s][A

nll mean: 141.05624389648438 	 kl mean: 1.1247355937957764 	 loss mean: 142.18096923828125
nll mean: 140.99398803710938 	 kl mean: 1.1247355937957764 	 loss mean: 142.11874389648438
nll mean: 141.307373046875 	 kl mean: 1.1247355937957764 	 loss mean: 142.43209838867188
nll mean: 141.29806518554688 	 kl mean: 1.1247355937957764 	 loss mean: 142.4228057861328



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.14it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.11it/s][A

nll mean: 141.22975158691406 	 kl mean: 1.1247355937957764 	 loss mean: 142.3544921875
nll mean: 141.26113891601562 	 kl mean: 1.1247355937957764 	 loss mean: 142.38587951660156
nll mean: 141.36083984375 	 kl mean: 1.1247355937957764 	 loss mean: 142.48556518554688
nll mean: 141.56040954589844 	 kl mean: 1.1247355937957764 	 loss mean: 142.68515014648438



                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.11it/s][A
 39%|███▉      | 15/38 [00:08<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]

nll mean: 141.12356567382812 	 kl mean: 1.1247355937957764 	 loss mean: 142.24830627441406
nll mean: 141.2408905029297 	 kl mean: 1.1247355937957764 	 loss mean: 142.36563110351562
nll mean: 148.01617431640625 	 kl mean: 1.4161932468414307 	 loss mean: 149.432373046875



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.84it/s][A

nll mean: 148.0359344482422 	 kl mean: 1.4161932468414307 	 loss mean: 149.4521484375
nll mean: 148.1424102783203 	 kl mean: 1.4161932468414307 	 loss mean: 149.55859375
nll mean: 148.04580688476562 	 kl mean: 1.4161932468414307 	 loss mean: 149.46200561523438



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.86it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A

nll mean: 148.46044921875 	 kl mean: 1.4161932468414307 	 loss mean: 149.87664794921875
nll mean: 148.2212677001953 	 kl mean: 1.4161932468414307 	 loss mean: 149.63746643066406
nll mean: 148.33380126953125 	 kl mean: 1.4161932468414307 	 loss mean: 149.75



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.86it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.82it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 148.35336303710938 	 kl mean: 1.4161932468414307 	 loss mean: 149.76956176757812
nll mean: 148.15658569335938 	 kl mean: 1.4161932468414307 	 loss mean: 149.57278442382812
nll mean: 148.1254119873047 	 kl mean: 1.4161932468414307 	 loss mean: 149.54159545898438



                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 25.09it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A

nll mean: 149.577392578125 	 kl mean: 1.2053974866867065 	 loss mean: 150.78277587890625
nll mean: 149.68821716308594 	 kl mean: 1.2053974866867065 	 loss mean: 150.89361572265625
nll mean: 149.8865966796875 	 kl mean: 1.2053974866867065 	 loss mean: 151.09197998046875
nll mean: 149.77145385742188 	 kl mean: 1.2053974866867065 	 loss mean: 150.97683715820312
nll mean: 149.86447143554688 	 kl mean: 1.2053974866867065 	 loss mean: 151.0698699951172



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.93it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.88it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.80it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 149.62728881835938 	 kl mean: 1.2053974866867065 	 loss mean: 150.83270263671875
nll mean: 149.7905731201172 	 kl mean: 1.2053974866867065 	 loss mean: 150.9959716796875
nll mean: 149.79257202148438 	 kl mean: 1.2053974866867065 	 loss mean: 150.99798583984375
nll mean: 149.83169555664062 	 kl mean: 1.2053974866867065 	 loss mean: 151.03709411621094
nll mean: 149.88677978515625 	 kl mean: 1.2053974866867065 	 loss mean: 151.09219360351562



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 30%|███       | 3/10 [00:00<00:00, 25.22it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A

nll mean: 138.68048095703125 	 kl mean: 1.2519629001617432 	 loss mean: 139.9324493408203
nll mean: 138.368896484375 	 kl mean: 1.2519629001617432 	 loss mean: 139.62086486816406
nll mean: 138.52066040039062 	 kl mean: 1.2519629001617432 	 loss mean: 139.77261352539062
nll mean: 138.33331298828125 	 kl mean: 1.2519629001617432 	 loss mean: 139.5852813720703
nll mean: 138.33987426757812 	 kl mean: 1.2519629001617432 	 loss mean: 139.59182739257812
nll mean: 138.37120056152344 	 kl mean: 1.2519629001617432 	 loss mean: 139.6231689453125



 60%|██████    | 6/10 [00:00<00:00, 25.24it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.21it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.18it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
[A                                   

nll mean: 138.38037109375 	 kl mean: 1.2519629001617432 	 loss mean: 139.63232421875
nll mean: 138.0994873046875 	 kl mean: 1.2519629001617432 	 loss mean: 139.3514404296875
nll mean: 138.17626953125 	 kl mean: 1.2519629001617432 	 loss mean: 139.42822265625
nll mean: 138.62301635742188 	 kl mean: 1.2519629001617432 	 loss mean: 139.87496948242188


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.76it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.76it/s]
 20%|██        | 2/10 [00:00<00:00, 12.82it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.76it/s][A

nll mean: 135.21163940429688 	 kl mean: 1.1756045818328857 	 loss mean: 136.3872528076172
nll mean: 134.9549560546875 	 kl mean: 1.1756045818328857 	 loss mean: 136.13055419921875
nll mean: 135.0848388671875 	 kl mean: 1.1756045818328857 	 loss mean: 136.2604522705078



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.84it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.92it/s][A

nll mean: 134.88455200195312 	 kl mean: 1.1756045818328857 	 loss mean: 136.06016540527344
nll mean: 134.9899444580078 	 kl mean: 1.1756045818328857 	 loss mean: 136.16554260253906
nll mean: 134.921875 	 kl mean: 1.1756045818328857 	 loss mean: 136.09747314453125



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.87it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A

nll mean: 135.05685424804688 	 kl mean: 1.1756045818328857 	 loss mean: 136.23248291015625
nll mean: 135.02838134765625 	 kl mean: 1.1756045818328857 	 loss mean: 136.20401000976562
nll mean: 135.0152587890625 	 kl mean: 1.1756045818328857 	 loss mean: 136.19085693359375



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.81it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.25it/s][A

nll mean: 135.09518432617188 	 kl mean: 1.1756045818328857 	 loss mean: 136.27078247070312
nll mean: 153.86984252929688 	 kl mean: 1.1732611656188965 	 loss mean: 155.04310607910156
nll mean: 153.89407348632812 	 kl mean: 1.1732611656188965 	 loss mean: 155.06732177734375



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.29it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s][A

nll mean: 153.7161865234375 	 kl mean: 1.1732611656188965 	 loss mean: 154.8894500732422
nll mean: 153.85293579101562 	 kl mean: 1.1732611656188965 	 loss mean: 155.0261993408203
nll mean: 153.97744750976562 	 kl mean: 1.1732611656188965 	 loss mean: 155.1507110595703



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.58it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.33it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.36it/s][A

nll mean: 154.06573486328125 	 kl mean: 1.1732611656188965 	 loss mean: 155.23898315429688
nll mean: 153.93826293945312 	 kl mean: 1.1732611656188965 	 loss mean: 155.11151123046875
nll mean: 153.83346557617188 	 kl mean: 1.1732611656188965 	 loss mean: 155.0067138671875



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 153.8472900390625 	 kl mean: 1.1732611656188965 	 loss mean: 155.02053833007812
nll mean: 153.93359375 	 kl mean: 1.1732611656188965 	 loss mean: 155.1068572998047
nll mean: 162.1343994140625 	 kl mean: 1.1645419597625732 	 loss mean: 163.2989501953125


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 13.25it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.07it/s][A

nll mean: 161.74127197265625 	 kl mean: 1.1645419597625732 	 loss mean: 162.90579223632812
nll mean: 162.06385803222656 	 kl mean: 1.1645419597625732 	 loss mean: 163.2283935546875
nll mean: 162.052490234375 	 kl mean: 1.1645419597625732 	 loss mean: 163.21702575683594


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 13.07it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.89it/s][A

nll mean: 161.92587280273438 	 kl mean: 1.1645419597625732 	 loss mean: 163.09042358398438
nll mean: 161.74533081054688 	 kl mean: 1.1645419597625732 	 loss mean: 162.9098663330078
nll mean: 162.14154052734375 	 kl mean: 1.1645419597625732 	 loss mean: 163.30609130859375


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.89it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.78it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.76it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 162.21865844726562 	 kl mean: 1.1645419597625732 	 loss mean: 163.38320922851562
nll mean: 161.86978149414062 	 kl mean: 1.1645419597625732 	 loss mean: 163.03433227539062
nll mean: 162.02450561523438 	 kl mean: 1.1645419597625732 	 loss mean: 163.1890411376953



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 10.41it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A

nll mean: 122.98677062988281 	 kl mean: 1.2714086771011353 	 loss mean: 124.2581787109375
nll mean: 122.90848541259766 	 kl mean: 1.2714086771011353 	 loss mean: 124.17990112304688
nll mean: 122.93115997314453 	 kl mean: 1.2714086771011353 	 loss mean: 124.20256805419922



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.31it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.30it/s][A

nll mean: 122.91390991210938 	 kl mean: 1.2714086771011353 	 loss mean: 124.1853256225586
nll mean: 122.84513854980469 	 kl mean: 1.2714086771011353 	 loss mean: 124.11654663085938
nll mean: 122.92076873779297 	 kl mean: 1.2714086771011353 	 loss mean: 124.19217681884766



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.35it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s][A

nll mean: 122.53878784179688 	 kl mean: 1.2714086771011353 	 loss mean: 123.8102035522461
nll mean: 122.9898910522461 	 kl mean: 1.2714086771011353 	 loss mean: 124.26130676269531
nll mean: 123.05816650390625 	 kl mean: 1.2714086771011353 	 loss mean: 124.32957458496094



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.29it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.50it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A

nll mean: 122.94660949707031 	 kl mean: 1.2714086771011353 	 loss mean: 124.218017578125
nll mean: 110.63128662109375 	 kl mean: 0.8659622669219971 	 loss mean: 111.49724578857422
nll mean: 110.38861846923828 	 kl mean: 0.8659622669219971 	 loss mean: 111.25458526611328
nll mean: 110.55874633789062 	 kl mean: 0.8659622669219971 	 loss mean: 111.42471313476562
nll mean: 110.60236358642578 	 kl mean: 0.8659622669219971 	 loss mean: 111.46832275390625
nll mean: 110.7573471069336 	 kl mean: 0.8659622669219971 	 loss mean: 111.62330627441406
nll mean: 110.74203491210938 	 kl mean: 0.8659622669219971 	 loss mean: 111.60799407958984



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
 80%|████████  | 8/10 [00:00<00:00, 33.23it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.93it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]

nll mean: 110.62512969970703 	 kl mean: 0.8659622669219971 	 loss mean: 111.4910888671875
nll mean: 110.51644134521484 	 kl mean: 0.8659622669219971 	 loss mean: 111.38240051269531
nll mean: 110.50079345703125 	 kl mean: 0.8659622669219971 	 loss mean: 111.36675262451172
nll mean: 110.61885833740234 	 kl mean: 0.8659622669219971 	 loss mean: 111.48481750488281
nll mean: 164.22607421875 	 kl mean: 1.0969346761703491 	 loss mean: 165.32301330566406



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 14.74it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.77it/s][A


nll mean: 164.32806396484375 	 kl mean: 1.0969346761703491 	 loss mean: 165.4250030517578
nll mean: 164.2628631591797 	 kl mean: 1.0969346761703491 	 loss mean: 165.35980224609375
nll mean: 164.3746337890625 	 kl mean: 1.0969346761703491 	 loss mean: 165.47157287597656


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.73it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A

nll mean: 164.3258819580078 	 kl mean: 1.0969346761703491 	 loss mean: 165.42282104492188
nll mean: 164.22035217285156 	 kl mean: 1.0969346761703491 	 loss mean: 165.31729125976562
nll mean: 164.29632568359375 	 kl mean: 1.0969346761703491 	 loss mean: 165.3932647705078



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.75it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.70it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]

nll mean: 164.2371826171875 	 kl mean: 1.0969346761703491 	 loss mean: 165.33412170410156
nll mean: 164.40872192382812 	 kl mean: 1.0969346761703491 	 loss mean: 165.5056610107422
nll mean: 164.2512664794922 	 kl mean: 1.0969346761703491 	 loss mean: 165.34820556640625
nll mean: 125.1981430053711 	 kl mean: 1.1991827487945557 	 loss mean: 126.39732360839844



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 22.03it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.83it/s][A

nll mean: 125.26458740234375 	 kl mean: 1.1991827487945557 	 loss mean: 126.46376037597656
nll mean: 125.39601135253906 	 kl mean: 1.1991827487945557 	 loss mean: 126.5951919555664
nll mean: 125.32600402832031 	 kl mean: 1.1991827487945557 	 loss mean: 126.52517700195312
nll mean: 125.39985656738281 	 kl mean: 1.1991827487945557 	 loss mean: 126.59903717041016
nll mean: 125.24602508544922 	 kl mean: 1.1991827487945557 	 loss mean: 126.44520568847656



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.74it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.71it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.1654052734375 	 kl mean: 1.1991827487945557 	 loss mean: 126.36458587646484
nll mean: 125.44056701660156 	 kl mean: 1.1991827487945557 	 loss mean: 126.63975524902344
nll mean: 125.52013397216797 	 kl mean: 1.1991827487945557 	 loss mean: 126.71932220458984
nll mean: 125.39218139648438 	 kl mean: 1.1991827487945557 	 loss mean: 126.59136962890625


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]


nll mean: 120.88221740722656 	 kl mean: 1.136910319328308 	 loss mean: 122.01913452148438
nll mean: 120.84225463867188 	 kl mean: 1.136910319328308 	 loss mean: 121.97916412353516
nll mean: 121.08135986328125 	 kl mean: 1.136910319328308 	 loss mean: 122.21826934814453
nll mean: 120.82640838623047 	 kl mean: 1.136910319328308 	 loss mean: 121.96331787109375


 20%|██        | 2/10 [00:00<00:00, 14.70it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
 40%|████      | 4/10 [00:00<00:00, 14.84it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
                                               [A

nll mean: 120.80110168457031 	 kl mean: 1.136910319328308 	 loss mean: 121.93800354003906
nll mean: 120.90524291992188 	 kl mean: 1.136910319328308 	 loss mean: 122.04215240478516
nll mean: 120.94075012207031 	 kl mean: 1.136910319328308 	 loss mean: 122.07765197753906



 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.84it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.87it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s]

nll mean: 121.05902099609375 	 kl mean: 1.136910319328308 	 loss mean: 122.19593048095703
nll mean: 121.03450775146484 	 kl mean: 1.136910319328308 	 loss mean: 122.17142486572266
nll mean: 120.93601989746094 	 kl mean: 1.136910319328308 	 loss mean: 122.07293701171875
nll mean: 86.6778564453125 	 kl mean: 1.2180222272872925 	 loss mean: 87.8958740234375



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s]
 30%|███       | 3/10 [00:00<00:00, 22.41it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.26it/s][A

nll mean: 86.7096176147461 	 kl mean: 1.2180222272872925 	 loss mean: 87.92764282226562
nll mean: 86.63729858398438 	 kl mean: 1.2180222272872925 	 loss mean: 87.8553237915039
nll mean: 86.70903778076172 	 kl mean: 1.2180222272872925 	 loss mean: 87.92706298828125
nll mean: 86.68067932128906 	 kl mean: 1.2180222272872925 	 loss mean: 87.8987045288086
nll mean: 86.60367584228516 	 kl mean: 1.2180222272872925 	 loss mean: 87.82170104980469



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.61it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.63it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.65it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 86.77395629882812 	 kl mean: 1.2180222272872925 	 loss mean: 87.99197387695312
nll mean: 86.52191925048828 	 kl mean: 1.2180222272872925 	 loss mean: 87.73994445800781
nll mean: 86.55599975585938 	 kl mean: 1.2180222272872925 	 loss mean: 87.7740249633789
nll mean: 86.64388275146484 	 kl mean: 1.2180222272872925 	 loss mean: 87.86190795898438
nll mean: 113.12632751464844 	 kl mean: 1.0213744640350342 	 loss mean: 114.147705078125


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
 30%|███       | 3/10 [00:00<00:00, 21.82it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.94it/s][A

nll mean: 112.95140838623047 	 kl mean: 1.0213744640350342 	 loss mean: 113.9727783203125
nll mean: 112.72505950927734 	 kl mean: 1.0213744640350342 	 loss mean: 113.74642944335938
nll mean: 112.94355773925781 	 kl mean: 1.0213744640350342 	 loss mean: 113.96493530273438
nll mean: 112.92243957519531 	 kl mean: 1.0213744640350342 	 loss mean: 113.94380950927734
nll mean: 113.01420593261719 	 kl mean: 1.0213744640350342 	 loss mean: 114.03558349609375


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.76it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.76it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.94it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.76it/s]
100%|██████████| 10/10 [00:00<00:00, 21.98it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.953125 	 kl mean: 1.0213744640350342 	 loss mean: 113.97450256347656
nll mean: 113.29759979248047 	 kl mean: 1.0213744640350342 	 loss mean: 114.31897735595703
nll mean: 113.0118408203125 	 kl mean: 1.0213744640350342 	 loss mean: 114.03321838378906
nll mean: 113.04737854003906 	 kl mean: 1.0213744640350342 	 loss mean: 114.06875610351562



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A

nll mean: 125.90528869628906 	 kl mean: 1.1334863901138306 	 loss mean: 127.03877258300781
nll mean: 126.14623260498047 	 kl mean: 1.1334863901138306 	 loss mean: 127.27972412109375
nll mean: 126.06289672851562 	 kl mean: 1.1334863901138306 	 loss mean: 127.19638061523438



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.73it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A

nll mean: 126.1800537109375 	 kl mean: 1.1334863901138306 	 loss mean: 127.31353759765625
nll mean: 126.15726470947266 	 kl mean: 1.1334863901138306 	 loss mean: 127.29075622558594
nll mean: 126.03876495361328 	 kl mean: 1.1334863901138306 	 loss mean: 127.17224884033203



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A

nll mean: 126.17743682861328 	 kl mean: 1.1334863901138306 	 loss mean: 127.31092834472656
nll mean: 126.176513671875 	 kl mean: 1.1334863901138306 	 loss mean: 127.30999755859375
nll mean: 125.92288970947266 	 kl mean: 1.1334863901138306 	 loss mean: 127.05638122558594



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.54it/s][A
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:17<00:05,  1.63it/s]
                                               


nll mean: 126.1306381225586 	 kl mean: 1.1334863901138306 	 loss mean: 127.26411437988281
nll mean: 66.78065490722656 	 kl mean: 1.4080675840377808 	 loss mean: 68.188720703125
nll mean: 66.71162414550781 	 kl mean: 1.4080675840377808 	 loss mean: 68.11968994140625


 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 10.17it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.23it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A

nll mean: 66.86804962158203 	 kl mean: 1.4080675840377808 	 loss mean: 68.27611541748047
nll mean: 66.49811553955078 	 kl mean: 1.4080675840377808 	 loss mean: 67.90618133544922
nll mean: 66.64048767089844 	 kl mean: 1.4080675840377808 	 loss mean: 68.04855346679688



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.25it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.31it/s][A

nll mean: 66.8225326538086 	 kl mean: 1.4080675840377808 	 loss mean: 68.23059844970703
nll mean: 66.55448150634766 	 kl mean: 1.4080675840377808 	 loss mean: 67.9625473022461
nll mean: 66.511474609375 	 kl mean: 1.4080675840377808 	 loss mean: 67.91954040527344



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.28it/s][A
 79%|███████▉  | 30/38 [00:18<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:18<00:05,  1.38it/s]

nll mean: 66.4178466796875 	 kl mean: 1.4080675840377808 	 loss mean: 67.82591247558594
nll mean: 66.3995132446289 	 kl mean: 1.4080675840377808 	 loss mean: 67.80757141113281
nll mean: 108.98279571533203 	 kl mean: 1.3651816844940186 	 loss mean: 110.34797668457031



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 12.82it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.96it/s][A

nll mean: 108.8766098022461 	 kl mean: 1.3651816844940186 	 loss mean: 110.24178314208984
nll mean: 108.81526184082031 	 kl mean: 1.3651816844940186 	 loss mean: 110.18045043945312
nll mean: 108.97966766357422 	 kl mean: 1.3651816844940186 	 loss mean: 110.3448486328125



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.91it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A

nll mean: 108.99928283691406 	 kl mean: 1.3651816844940186 	 loss mean: 110.36447143554688
nll mean: 109.04818725585938 	 kl mean: 1.3651816844940186 	 loss mean: 110.41336822509766
nll mean: 108.80197143554688 	 kl mean: 1.3651816844940186 	 loss mean: 110.16716003417969



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.92it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.95it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.11306762695312 	 kl mean: 1.3651816844940186 	 loss mean: 110.47825622558594
nll mean: 108.83305358886719 	 kl mean: 1.3651816844940186 	 loss mean: 110.1982421875
nll mean: 108.92181396484375 	 kl mean: 1.3651816844940186 	 loss mean: 110.28700256347656



                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 10.22it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s][A

nll mean: 142.58908081054688 	 kl mean: 1.2102267742156982 	 loss mean: 143.79930114746094
nll mean: 142.54185485839844 	 kl mean: 1.2102267742156982 	 loss mean: 143.7520751953125
nll mean: 142.7325439453125 	 kl mean: 1.2102267742156982 	 loss mean: 143.94276428222656



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.17it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.11it/s][A
                                              

nll mean: 142.87213134765625 	 kl mean: 1.2102267742156982 	 loss mean: 144.0823516845703
nll mean: 142.49667358398438 	 kl mean: 1.2102267742156982 	 loss mean: 143.70689392089844


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.04it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.01it/s][A


nll mean: 142.86276245117188 	 kl mean: 1.2102267742156982 	 loss mean: 144.072998046875
nll mean: 142.76358032226562 	 kl mean: 1.2102267742156982 	 loss mean: 143.97381591796875


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.97it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.87it/s][A

nll mean: 142.61228942871094 	 kl mean: 1.2102267742156982 	 loss mean: 143.822509765625
nll mean: 142.8585205078125 	 kl mean: 1.2102267742156982 	 loss mean: 144.06875610351562



                                               
100%|██████████| 10/10 [00:01<00:00,  9.99it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.27it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A

nll mean: 142.75621032714844 	 kl mean: 1.2102267742156982 	 loss mean: 143.9664306640625
nll mean: 66.05846405029297 	 kl mean: 1.3233745098114014 	 loss mean: 67.3818359375
nll mean: 66.2470932006836 	 kl mean: 1.3233745098114014 	 loss mean: 67.57046508789062
nll mean: 66.25056457519531 	 kl mean: 1.3233745098114014 	 loss mean: 67.57393646240234
nll mean: 66.27742004394531 	 kl mean: 1.3233745098114014 	 loss mean: 67.60079956054688
nll mean: 66.68408203125 	 kl mean: 1.3233745098114014 	 loss mean: 68.00746154785156



                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.99it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.87it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.72it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 66.34119415283203 	 kl mean: 1.3233745098114014 	 loss mean: 67.66456604003906
nll mean: 66.42277526855469 	 kl mean: 1.3233745098114014 	 loss mean: 67.74615478515625
nll mean: 66.25729370117188 	 kl mean: 1.3233745098114014 	 loss mean: 67.5806655883789
nll mean: 66.4373779296875 	 kl mean: 1.3233745098114014 	 loss mean: 67.76074981689453
nll mean: 66.45630645751953 	 kl mean: 1.3233745098114014 	 loss mean: 67.77967834472656



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s]
 30%|███       | 3/10 [00:00<00:00, 22.29it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A

nll mean: 124.34030151367188 	 kl mean: 1.0855529308319092 	 loss mean: 125.42585754394531
nll mean: 124.38090515136719 	 kl mean: 1.0855529308319092 	 loss mean: 125.46646118164062
nll mean: 124.18465423583984 	 kl mean: 1.0855529308319092 	 loss mean: 125.27021026611328
nll mean: 124.31510925292969 	 kl mean: 1.0855529308319092 	 loss mean: 125.40065002441406
nll mean: 124.3219985961914 	 kl mean: 1.0855529308319092 	 loss mean: 125.40755462646484



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.18it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.45it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.09it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.02it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.4322509765625 	 kl mean: 1.0855529308319092 	 loss mean: 125.51780700683594
nll mean: 124.23727416992188 	 kl mean: 1.0855529308319092 	 loss mean: 125.32283020019531
nll mean: 124.06791687011719 	 kl mean: 1.0855529308319092 	 loss mean: 125.15347290039062
nll mean: 124.23760223388672 	 kl mean: 1.0855529308319092 	 loss mean: 125.32315063476562
nll mean: 124.21534729003906 	 kl mean: 1.0855529308319092 	 loss mean: 125.3009033203125


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 12.31it/s][A

nll mean: 124.29293060302734 	 kl mean: 1.1687871217727661 	 loss mean: 125.46170806884766
nll mean: 124.367431640625 	 kl mean: 1.1687871217727661 	 loss mean: 125.53620910644531
nll mean: 124.40377044677734 	 kl mean: 1.1687871217727661 	 loss mean: 125.57255554199219


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 12.31it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 12.37it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A

nll mean: 124.51869201660156 	 kl mean: 1.1687871217727661 	 loss mean: 125.6874771118164
nll mean: 124.401123046875 	 kl mean: 1.1687871217727661 	 loss mean: 125.56991577148438
nll mean: 124.48672485351562 	 kl mean: 1.1687871217727661 	 loss mean: 125.655517578125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A

nll mean: 124.46520233154297 	 kl mean: 1.1687871217727661 	 loss mean: 125.63398742675781
nll mean: 124.33335876464844 	 kl mean: 1.1687871217727661 	 loss mean: 125.50214385986328
nll mean: 124.56266021728516 	 kl mean: 1.1687871217727661 	 loss mean: 125.7314453125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.63it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.73it/s][A

nll mean: 124.59528350830078 	 kl mean: 1.1687871217727661 	 loss mean: 125.76406860351562
nll mean: 118.54499816894531 	 kl mean: 1.2332239151000977 	 loss mean: 119.77821350097656
nll mean: 118.61978149414062 	 kl mean: 1.2332239151000977 	 loss mean: 119.85301208496094



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.68it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s][A

nll mean: 118.6609878540039 	 kl mean: 1.2332239151000977 	 loss mean: 119.89421844482422
nll mean: 118.66069030761719 	 kl mean: 1.2332239151000977 	 loss mean: 119.8939208984375
nll mean: 118.60084533691406 	 kl mean: 1.2332239151000977 	 loss mean: 119.83406829833984



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.65it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.67it/s][A

nll mean: 118.56010437011719 	 kl mean: 1.2332239151000977 	 loss mean: 119.79332733154297
nll mean: 118.49081420898438 	 kl mean: 1.2332239151000977 	 loss mean: 119.72404479980469
nll mean: 118.46880340576172 	 kl mean: 1.2332239151000977 	 loss mean: 119.7020263671875



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.64it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]

nll mean: 118.50284576416016 	 kl mean: 1.2332239151000977 	 loss mean: 119.73606872558594
nll mean: 118.63134765625 	 kl mean: 1.2332239151000977 	 loss mean: 119.86457061767578
nll mean: 116.6262435913086 	 kl mean: 1.0446960926055908 	 loss mean: 117.67093658447266
nll mean: 116.91450500488281 	 kl mean: 1.0446960926055908 	 loss mean: 117.9592056274414



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 21.53it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.41it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A

nll mean: 116.88685607910156 	 kl mean: 1.0446960926055908 	 loss mean: 117.93155670166016
nll mean: 116.8405990600586 	 kl mean: 1.0446960926055908 	 loss mean: 117.88529205322266
nll mean: 116.739990234375 	 kl mean: 1.0446960926055908 	 loss mean: 117.7846908569336
nll mean: 116.5497055053711 	 kl mean: 1.0446960926055908 	 loss mean: 117.59439086914062
nll mean: 116.5821533203125 	 kl mean: 1.0446960926055908 	 loss mean: 117.62684631347656



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.53it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.64it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]

nll mean: 116.55674743652344 	 kl mean: 1.0446960926055908 	 loss mean: 117.60144805908203
nll mean: 116.80777740478516 	 kl mean: 1.0446960926055908 	 loss mean: 117.85246276855469
nll mean: 116.87850952148438 	 kl mean: 1.0446960926055908 	 loss mean: 117.92320251464844
nll mean: 89.81968688964844 	 kl mean: 1.7276853322982788 	 loss mean: 91.54736328125
nll mean: 90.16035461425781 	 kl mean: 1.7276853322982788 	 loss mean: 91.88804626464844
nll mean: 90.04209899902344 	 kl mean: 1.7276853322982788 	 loss mean: 91.769775390625



                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 30.85it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.87it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.68it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.58it/s]


nll mean: 89.76492309570312 	 kl mean: 1.7276853322982788 	 loss mean: 91.49261474609375
nll mean: 89.7820053100586 	 kl mean: 1.7276853322982788 	 loss mean: 91.50969696044922
nll mean: 90.08540344238281 	 kl mean: 1.7276853322982788 	 loss mean: 91.81309509277344
nll mean: 90.03085327148438 	 kl mean: 1.7276853322982788 	 loss mean: 91.758544921875
nll mean: 89.83751678466797 	 kl mean: 1.7276853322982788 	 loss mean: 91.56520080566406
nll mean: 89.92997741699219 	 kl mean: 1.7276853322982788 	 loss mean: 91.65767669677734
nll mean: 90.04618835449219 	 kl mean: 1.7276853322982788 	 loss mean: 91.77388000488281
Approximate NLL:
tensor(126.3611, device='cuda:0')
Approximate KL:
tensor(1.2080, device='cuda:0')
Testing took 0:00:24.962657


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .96it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .96it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .96it/s][A

nll mean: 117.78890991210938 	 kl mean: 0.9688363671302795 	 loss mean: 118.75775146484375
nll mean: 117.51731872558594 	 kl mean: 0.9688363671302795 	 loss mean: 118.48615264892578
nll mean: 117.76402282714844 	 kl mean: 0.9688363671302795 	 loss mean: 118.73286437988281
nll mean: 117.59715270996094 	 kl mean: 0.9688363671302795 	 loss mean: 118.56597900390625
nll mean: 117.726318359375 	 kl mean: 0.9688363671302795 	 loss mean: 118.69514465332031



  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.96it/s][A
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                      .45it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.23it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.67505645751953 	 kl mean: 0.9688363671302795 	 loss mean: 118.64389038085938
nll mean: 117.54450988769531 	 kl mean: 0.9688363671302795 	 loss mean: 118.51335144042969
nll mean: 117.77936553955078 	 kl mean: 0.9688363671302795 	 loss mean: 118.74819946289062
nll mean: 117.75244903564453 	 kl mean: 0.9688363671302795 	 loss mean: 118.72128295898438
nll mean: 117.71883392333984 	 kl mean: 0.9688363671302795 	 loss mean: 118.68766784667969


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 20%|██        | 2/10 [00:00<00:00, 13.78it/s][A

nll mean: 132.8203125 	 kl mean: 1.1576950550079346 	 loss mean: 133.97799682617188
nll mean: 133.0897979736328 	 kl mean: 1.1576950550079346 	 loss mean: 134.24749755859375
nll mean: 132.98362731933594 	 kl mean: 1.1576950550079346 	 loss mean: 134.1413116455078


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 20%|██        | 2/10 [00:00<00:00, 13.78it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 40%|████      | 4/10 [00:00<00:00, 13.81it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.94it/s][A

nll mean: 132.9320068359375 	 kl mean: 1.1576950550079346 	 loss mean: 134.08970642089844
nll mean: 132.89376831054688 	 kl mean: 1.1576950550079346 	 loss mean: 134.0514678955078
nll mean: 132.87466430664062 	 kl mean: 1.1576950550079346 	 loss mean: 134.0323486328125


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.94it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.99it/s][A

nll mean: 132.90879821777344 	 kl mean: 1.1576950550079346 	 loss mean: 134.06649780273438
nll mean: 132.79498291015625 	 kl mean: 1.1576950550079346 	 loss mean: 133.95269775390625
nll mean: 133.03604125976562 	 kl mean: 1.1576950550079346 	 loss mean: 134.1937255859375


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.99it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.99it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 25.20it/s][A

nll mean: 132.89462280273438 	 kl mean: 1.1576950550079346 	 loss mean: 134.05233764648438
nll mean: 105.58528137207031 	 kl mean: 0.9987717866897583 	 loss mean: 106.58404541015625
nll mean: 105.73530578613281 	 kl mean: 0.9987717866897583 	 loss mean: 106.73408508300781
nll mean: 105.58651733398438 	 kl mean: 0.9987717866897583 	 loss mean: 106.58528900146484
nll mean: 106.03214263916016 	 kl mean: 0.9987717866897583 	 loss mean: 107.03092193603516


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 25.20it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.85it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.49it/s][A

nll mean: 105.53480529785156 	 kl mean: 0.9987717866897583 	 loss mean: 106.53357696533203
nll mean: 105.54147338867188 	 kl mean: 0.9987717866897583 	 loss mean: 106.54024505615234
nll mean: 105.43331909179688 	 kl mean: 0.9987717866897583 	 loss mean: 106.43209838867188
nll mean: 105.69561004638672 	 kl mean: 0.9987717866897583 	 loss mean: 106.69438171386719
nll mean: 105.94120788574219 	 kl mean: 0.9987717866897583 	 loss mean: 106.93998718261719


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
100%|██████████| 10/10 [00:00<00:00, 24.19it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.73it/s][A

nll mean: 105.37387084960938 	 kl mean: 0.9987717866897583 	 loss mean: 106.37264251708984
nll mean: 144.07476806640625 	 kl mean: 1.083130121231079 	 loss mean: 145.15789794921875
nll mean: 143.8453369140625 	 kl mean: 1.083130121231079 	 loss mean: 144.928466796875


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.73it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A

nll mean: 143.8215789794922 	 kl mean: 1.083130121231079 	 loss mean: 144.9047088623047
nll mean: 144.1128692626953 	 kl mean: 1.083130121231079 	 loss mean: 145.19598388671875
nll mean: 143.88717651367188 	 kl mean: 1.083130121231079 	 loss mean: 144.97030639648438


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.78it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A

nll mean: 143.764892578125 	 kl mean: 1.083130121231079 	 loss mean: 144.8480224609375
nll mean: 143.93179321289062 	 kl mean: 1.083130121231079 	 loss mean: 145.0149383544922
nll mean: 143.91030883789062 	 kl mean: 1.083130121231079 	 loss mean: 144.99343872070312


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.76it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.88265991210938 	 kl mean: 1.083130121231079 	 loss mean: 144.96578979492188
nll mean: 143.83859252929688 	 kl mean: 1.083130121231079 	 loss mean: 144.92173767089844
nll mean: 131.04034423828125 	 kl mean: 1.0072650909423828 	 loss mean: 132.047607421875


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.29it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.12it/s][A

nll mean: 131.0803680419922 	 kl mean: 1.0072650909423828 	 loss mean: 132.087646484375
nll mean: 131.0639190673828 	 kl mean: 1.0072650909423828 	 loss mean: 132.07118225097656
nll mean: 131.19476318359375 	 kl mean: 1.0072650909423828 	 loss mean: 132.2020263671875


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 40%|████      | 4/10 [00:00<00:00, 14.12it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.15it/s][A

nll mean: 131.27304077148438 	 kl mean: 1.0072650909423828 	 loss mean: 132.28030395507812
nll mean: 130.8708038330078 	 kl mean: 1.0072650909423828 	 loss mean: 131.87806701660156
nll mean: 131.0043182373047 	 kl mean: 1.0072650909423828 	 loss mean: 132.0115966796875


                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.15it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.14it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.06it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 131.17709350585938 	 kl mean: 1.0072650909423828 	 loss mean: 132.18435668945312
nll mean: 130.97119140625 	 kl mean: 1.0072650909423828 	 loss mean: 131.9784698486328
nll mean: 130.95816040039062 	 kl mean: 1.0072650909423828 	 loss mean: 131.96542358398438


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A

nll mean: 129.58021545410156 	 kl mean: 1.0444430112838745 	 loss mean: 130.62466430664062
nll mean: 129.89691162109375 	 kl mean: 1.0444430112838745 	 loss mean: 130.9413604736328
nll mean: 129.74661254882812 	 kl mean: 1.0444430112838745 	 loss mean: 130.79104614257812


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 14.32it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.50it/s][A

nll mean: 129.71771240234375 	 kl mean: 1.0444430112838745 	 loss mean: 130.7621612548828
nll mean: 129.65283203125 	 kl mean: 1.0444430112838745 	 loss mean: 130.697265625
nll mean: 129.47744750976562 	 kl mean: 1.0444430112838745 	 loss mean: 130.52188110351562


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.50it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.46it/s][A

nll mean: 129.63705444335938 	 kl mean: 1.0444430112838745 	 loss mean: 130.68148803710938
nll mean: 129.5839385986328 	 kl mean: 1.0444430112838745 	 loss mean: 130.6283721923828
nll mean: 129.50425720214844 	 kl mean: 1.0444430112838745 	 loss mean: 130.5487060546875


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.35it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
[A                                           

nll mean: 129.74270629882812 	 kl mean: 1.0444430112838745 	 loss mean: 130.78713989257812
nll mean: 140.10800170898438 	 kl mean: 0.9084093570709229 	 loss mean: 141.01641845703125
nll mean: 140.15545654296875 	 kl mean: 0.9084093570709229 	 loss mean: 141.06387329101562
nll mean: 140.05426025390625 	 kl mean: 0.9084093570709229 	 loss mean: 140.96267700195312
nll mean: 140.1176300048828 	 kl mean: 0.9084093570709229 	 loss mean: 141.0260467529297


 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.69it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.43it/s][A
                                              [A

nll mean: 140.03790283203125 	 kl mean: 0.9084093570709229 	 loss mean: 140.94630432128906
nll mean: 140.09829711914062 	 kl mean: 0.9084093570709229 	 loss mean: 141.0067138671875
nll mean: 140.13735961914062 	 kl mean: 0.9084093570709229 	 loss mean: 141.0457763671875
nll mean: 140.2003173828125 	 kl mean: 0.9084093570709229 	 loss mean: 141.10873413085938
nll mean: 140.2541046142578 	 kl mean: 0.9084093570709229 	 loss mean: 141.16250610351562



 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 25.08it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A

nll mean: 140.27578735351562 	 kl mean: 0.9084093570709229 	 loss mean: 141.1842041015625
nll mean: 111.19271087646484 	 kl mean: 1.074345350265503 	 loss mean: 112.26705932617188
nll mean: 111.06791687011719 	 kl mean: 1.074345350265503 	 loss mean: 112.14225769042969
nll mean: 111.076416015625 	 kl mean: 1.074345350265503 	 loss mean: 112.15076446533203
nll mean: 111.30296325683594 	 kl mean: 1.074345350265503 	 loss mean: 112.3772964477539



 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.35it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.18it/s][A
                                              [A

nll mean: 111.0767593383789 	 kl mean: 1.074345350265503 	 loss mean: 112.15110778808594
nll mean: 111.11079406738281 	 kl mean: 1.074345350265503 	 loss mean: 112.18513488769531
nll mean: 111.2571029663086 	 kl mean: 1.074345350265503 	 loss mean: 112.33145141601562
nll mean: 111.09683227539062 	 kl mean: 1.074345350265503 	 loss mean: 112.17117309570312
nll mean: 111.29679870605469 	 kl mean: 1.074345350265503 	 loss mean: 112.37113952636719



 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 24.99it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.38it/s][A

nll mean: 111.0062026977539 	 kl mean: 1.074345350265503 	 loss mean: 112.08055114746094
nll mean: 137.6458740234375 	 kl mean: 1.07753324508667 	 loss mean: 138.72340393066406
nll mean: 137.5786590576172 	 kl mean: 1.07753324508667 	 loss mean: 138.65618896484375


                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
 20%|██        | 2/10 [00:00<00:00, 14.38it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 40%|████      | 4/10 [00:00<00:00, 14.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.79it/s][A

nll mean: 137.5770721435547 	 kl mean: 1.07753324508667 	 loss mean: 138.65460205078125
nll mean: 137.78958129882812 	 kl mean: 1.07753324508667 	 loss mean: 138.86712646484375
nll mean: 137.65481567382812 	 kl mean: 1.07753324508667 	 loss mean: 138.73233032226562
nll mean: 137.80348205566406 	 kl mean: 1.07753324508667 	 loss mean: 138.88101196289062


                                              
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.79it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.60it/s][A

nll mean: 137.677490234375 	 kl mean: 1.07753324508667 	 loss mean: 138.75502014160156
nll mean: 137.74166870117188 	 kl mean: 1.07753324508667 	 loss mean: 138.81919860839844
nll mean: 137.4480743408203 	 kl mean: 1.07753324508667 	 loss mean: 138.52560424804688


                                              
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.62it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.92it/s][A

nll mean: 137.5770263671875 	 kl mean: 1.07753324508667 	 loss mean: 138.654541015625
nll mean: 137.79446411132812 	 kl mean: 0.9060052037239075 	 loss mean: 138.70046997070312
nll mean: 137.91513061523438 	 kl mean: 0.9060052037239075 	 loss mean: 138.82113647460938
nll mean: 137.80665588378906 	 kl mean: 0.9060052037239075 	 loss mean: 138.712646484375
nll mean: 137.95352172851562 	 kl mean: 0.9060052037239075 	 loss mean: 138.85952758789062


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.92it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 50%|█████     | 5/10 [00:00<00:00, 21.27it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 80%|████████  | 8/10 [00:00<00:00, 21.17it/s][A

nll mean: 137.85928344726562 	 kl mean: 0.9060052037239075 	 loss mean: 138.76528930664062
nll mean: 137.96234130859375 	 kl mean: 0.9060052037239075 	 loss mean: 138.86834716796875
nll mean: 137.85499572753906 	 kl mean: 0.9060052037239075 	 loss mean: 138.76100158691406
nll mean: 137.85772705078125 	 kl mean: 0.9060052037239075 	 loss mean: 138.76373291015625
nll mean: 137.8642578125 	 kl mean: 0.9060052037239075 	 loss mean: 138.770263671875


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 20.96it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.76it/s][A

nll mean: 137.83148193359375 	 kl mean: 0.9060052037239075 	 loss mean: 138.73748779296875
nll mean: 124.68232727050781 	 kl mean: 1.2521343231201172 	 loss mean: 125.93446350097656
nll mean: 124.8683853149414 	 kl mean: 1.2521343231201172 	 loss mean: 126.12052917480469
nll mean: 124.80632019042969 	 kl mean: 1.2521343231201172 	 loss mean: 126.05845642089844
nll mean: 124.80696868896484 	 kl mean: 1.2521343231201172 	 loss mean: 126.05911254882812


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.76it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.68it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.69it/s][A

nll mean: 124.86632537841797 	 kl mean: 1.2521343231201172 	 loss mean: 126.11846923828125
nll mean: 125.00663757324219 	 kl mean: 1.2521343231201172 	 loss mean: 126.25878143310547
nll mean: 124.74390411376953 	 kl mean: 1.2521343231201172 	 loss mean: 125.99603271484375
nll mean: 125.03265380859375 	 kl mean: 1.2521343231201172 	 loss mean: 126.2847900390625
nll mean: 124.57098388671875 	 kl mean: 1.2521343231201172 	 loss mean: 125.8231201171875


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
100%|██████████| 10/10 [00:00<00:00, 24.62it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.28it/s][A

nll mean: 124.85964965820312 	 kl mean: 1.2521343231201172 	 loss mean: 126.11178588867188
nll mean: 146.7062530517578 	 kl mean: 1.1081502437591553 	 loss mean: 147.81439208984375
nll mean: 146.63372802734375 	 kl mean: 1.1081502437591553 	 loss mean: 147.74188232421875
nll mean: 146.80422973632812 	 kl mean: 1.1081502437591553 	 loss mean: 147.91238403320312
nll mean: 147.11363220214844 	 kl mean: 1.1081502437591553 	 loss mean: 148.22177124023438


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.28it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.35it/s][A

nll mean: 146.82388305664062 	 kl mean: 1.1081502437591553 	 loss mean: 147.93203735351562
nll mean: 147.00930786132812 	 kl mean: 1.1081502437591553 	 loss mean: 148.11746215820312
nll mean: 146.93972778320312 	 kl mean: 1.1081502437591553 	 loss mean: 148.04788208007812
nll mean: 146.98411560058594 	 kl mean: 1.1081502437591553 	 loss mean: 148.09226989746094
nll mean: 146.94174194335938 	 kl mean: 1.1081502437591553 	 loss mean: 148.04989624023438


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
100%|██████████| 10/10 [00:00<00:00, 21.38it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.20it/s][A

nll mean: 146.98126220703125 	 kl mean: 1.1081502437591553 	 loss mean: 148.08941650390625
nll mean: 124.41777038574219 	 kl mean: 1.2766470909118652 	 loss mean: 125.69440460205078
nll mean: 124.51666259765625 	 kl mean: 1.2766470909118652 	 loss mean: 125.79331970214844


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.20it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.27it/s][A

nll mean: 124.5975570678711 	 kl mean: 1.2766470909118652 	 loss mean: 125.87420654296875
nll mean: 124.64933013916016 	 kl mean: 1.2766470909118652 	 loss mean: 125.92597961425781
nll mean: 124.43824768066406 	 kl mean: 1.2766470909118652 	 loss mean: 125.71489715576172


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.27it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.33it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A

nll mean: 124.33809661865234 	 kl mean: 1.2766470909118652 	 loss mean: 125.61473083496094
nll mean: 124.64974212646484 	 kl mean: 1.2766470909118652 	 loss mean: 125.9263916015625
nll mean: 124.34953308105469 	 kl mean: 1.2766470909118652 	 loss mean: 125.62617492675781


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.62it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.48243713378906 	 kl mean: 1.2766470909118652 	 loss mean: 125.75908660888672
nll mean: 124.60771942138672 	 kl mean: 1.2766470909118652 	 loss mean: 125.88436889648438
nll mean: 167.10321044921875 	 kl mean: 1.2033904790878296 	 loss mean: 168.30657958984375


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 10.21it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.09it/s][A

nll mean: 167.23574829101562 	 kl mean: 1.2033904790878296 	 loss mean: 168.43914794921875
nll mean: 166.87240600585938 	 kl mean: 1.2033904790878296 	 loss mean: 168.0758056640625


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 10.09it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00, 10.03it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.06it/s][A

nll mean: 167.2566375732422 	 kl mean: 1.2033904790878296 	 loss mean: 168.46002197265625
nll mean: 167.3035888671875 	 kl mean: 1.2033904790878296 	 loss mean: 168.5069580078125
nll mean: 167.46377563476562 	 kl mean: 1.2033904790878296 	 loss mean: 168.66717529296875


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.06it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.12it/s][A

nll mean: 166.80709838867188 	 kl mean: 1.2033904790878296 	 loss mean: 168.010498046875
nll mean: 167.00390625 	 kl mean: 1.2033904790878296 	 loss mean: 168.20730590820312
nll mean: 166.9935302734375 	 kl mean: 1.2033904790878296 	 loss mean: 168.19692993164062


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.12it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.11it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.36it/s][A

nll mean: 167.03692626953125 	 kl mean: 1.2033904790878296 	 loss mean: 168.2403106689453
nll mean: 141.02072143554688 	 kl mean: 1.0181245803833008 	 loss mean: 142.03884887695312
nll mean: 140.9019775390625 	 kl mean: 1.0181245803833008 	 loss mean: 141.92010498046875
nll mean: 140.92904663085938 	 kl mean: 1.0181245803833008 	 loss mean: 141.94717407226562


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.36it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 40%|████      | 4/10 [00:00<00:00, 18.15it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.19it/s][A

nll mean: 141.02813720703125 	 kl mean: 1.0181245803833008 	 loss mean: 142.0462646484375
nll mean: 141.30227661132812 	 kl mean: 1.0181245803833008 	 loss mean: 142.32040405273438
nll mean: 141.15670776367188 	 kl mean: 1.0181245803833008 	 loss mean: 142.17481994628906
nll mean: 141.22540283203125 	 kl mean: 1.0181245803833008 	 loss mean: 142.2435302734375


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.19it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:16,  1.41it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.15it/s][A
100%|██████████| 10/10 [00:00<00:00, 18.09it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 141.1520233154297 	 kl mean: 1.0181245803833008 	 loss mean: 142.17015075683594
nll mean: 141.1668701171875 	 kl mean: 1.0181245803833008 	 loss mean: 142.1849822998047
nll mean: 141.0743408203125 	 kl mean: 1.0181245803833008 	 loss mean: 142.09246826171875


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.85it/s][A

nll mean: 149.3404541015625 	 kl mean: 1.157757043838501 	 loss mean: 150.49822998046875
nll mean: 149.45050048828125 	 kl mean: 1.157757043838501 	 loss mean: 150.60824584960938
nll mean: 149.31851196289062 	 kl mean: 1.157757043838501 	 loss mean: 150.4762725830078


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.85it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 40%|████      | 4/10 [00:00<00:00, 10.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.87it/s][A

nll mean: 149.28244018554688 	 kl mean: 1.157757043838501 	 loss mean: 150.44021606445312
nll mean: 149.0374298095703 	 kl mean: 1.157757043838501 	 loss mean: 150.1951904296875
nll mean: 149.34344482421875 	 kl mean: 1.157757043838501 	 loss mean: 150.50120544433594


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.87it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.84it/s][A

nll mean: 149.27032470703125 	 kl mean: 1.157757043838501 	 loss mean: 150.4281005859375
nll mean: 149.353271484375 	 kl mean: 1.157757043838501 	 loss mean: 150.51101684570312
nll mean: 149.28271484375 	 kl mean: 1.157757043838501 	 loss mean: 150.44049072265625


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.81it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 24.82it/s][A

nll mean: 149.14891052246094 	 kl mean: 1.157757043838501 	 loss mean: 150.30665588378906
nll mean: 150.43881225585938 	 kl mean: 0.9486849308013916 	 loss mean: 151.38748168945312
nll mean: 150.22872924804688 	 kl mean: 0.9486849308013916 	 loss mean: 151.17739868164062
nll mean: 150.29568481445312 	 kl mean: 0.9486849308013916 	 loss mean: 151.244384765625
nll mean: 149.94735717773438 	 kl mean: 0.9486849308013916 	 loss mean: 150.89602661132812


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
 30%|███       | 3/10 [00:00<00:00, 24.82it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.67it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.54it/s][A

nll mean: 150.22555541992188 	 kl mean: 0.9486849308013916 	 loss mean: 151.1742401123047
nll mean: 150.21652221679688 	 kl mean: 0.9486849308013916 	 loss mean: 151.1652069091797
nll mean: 150.35855102539062 	 kl mean: 0.9486849308013916 	 loss mean: 151.30723571777344
nll mean: 150.23394775390625 	 kl mean: 0.9486849308013916 	 loss mean: 151.1826171875
nll mean: 150.208251953125 	 kl mean: 0.9486849308013916 	 loss mean: 151.15692138671875


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.35it/s]
100%|██████████| 10/10 [00:00<00:00, 24.36it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A

nll mean: 150.05662536621094 	 kl mean: 0.9486849308013916 	 loss mean: 151.0052947998047
nll mean: 139.45648193359375 	 kl mean: 1.0869052410125732 	 loss mean: 140.54339599609375
nll mean: 139.60842895507812 	 kl mean: 1.0869052410125732 	 loss mean: 140.69534301757812
nll mean: 139.49688720703125 	 kl mean: 1.0869052410125732 	 loss mean: 140.58380126953125
nll mean: 139.57891845703125 	 kl mean: 1.0869052410125732 	 loss mean: 140.6658172607422


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.87it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.86it/s][A

nll mean: 139.4740753173828 	 kl mean: 1.0869052410125732 	 loss mean: 140.56097412109375
nll mean: 139.7296905517578 	 kl mean: 1.0869052410125732 	 loss mean: 140.8166046142578
nll mean: 139.21743774414062 	 kl mean: 1.0869052410125732 	 loss mean: 140.30433654785156
nll mean: 139.28726196289062 	 kl mean: 1.0869052410125732 	 loss mean: 140.37417602539062
nll mean: 139.49575805664062 	 kl mean: 1.0869052410125732 	 loss mean: 140.58267211914062


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.56it/s]
100%|██████████| 10/10 [00:00<00:00, 24.82it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A

nll mean: 139.2669677734375 	 kl mean: 1.0869052410125732 	 loss mean: 140.35386657714844
nll mean: 136.8785400390625 	 kl mean: 1.1099956035614014 	 loss mean: 137.98854064941406
nll mean: 136.97434997558594 	 kl mean: 1.1099956035614014 	 loss mean: 138.08433532714844


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A

nll mean: 136.97262573242188 	 kl mean: 1.1099956035614014 	 loss mean: 138.08261108398438
nll mean: 136.96591186523438 	 kl mean: 1.1099956035614014 	 loss mean: 138.07591247558594
nll mean: 136.765625 	 kl mean: 1.1099956035614014 	 loss mean: 137.8756103515625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A

nll mean: 136.8324737548828 	 kl mean: 1.1099956035614014 	 loss mean: 137.9424591064453
nll mean: 136.8931884765625 	 kl mean: 1.1099956035614014 	 loss mean: 138.003173828125
nll mean: 136.81431579589844 	 kl mean: 1.1099956035614014 	 loss mean: 137.92431640625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.71it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.91033935546875 	 kl mean: 1.1099956035614014 	 loss mean: 138.02035522460938
nll mean: 136.7830810546875 	 kl mean: 1.1099956035614014 	 loss mean: 137.89306640625
nll mean: 154.38189697265625 	 kl mean: 0.9403766989707947 	 loss mean: 155.322265625


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.66it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.79it/s][A

nll mean: 154.40777587890625 	 kl mean: 0.9403766989707947 	 loss mean: 155.34814453125
nll mean: 154.4192352294922 	 kl mean: 0.9403766989707947 	 loss mean: 155.359619140625
nll mean: 154.28208923339844 	 kl mean: 0.9403766989707947 	 loss mean: 155.22247314453125


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.79it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.76it/s][A

nll mean: 154.39682006835938 	 kl mean: 0.9403766989707947 	 loss mean: 155.33718872070312
nll mean: 154.49038696289062 	 kl mean: 0.9403766989707947 	 loss mean: 155.43075561523438
nll mean: 154.49444580078125 	 kl mean: 0.9403766989707947 	 loss mean: 155.43482971191406


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.76it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.73it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 154.33529663085938 	 kl mean: 0.9403766989707947 	 loss mean: 155.27566528320312
nll mean: 154.27346801757812 	 kl mean: 0.9403766989707947 	 loss mean: 155.21385192871094
nll mean: 154.4383087158203 	 kl mean: 0.9403766989707947 	 loss mean: 155.37869262695312


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.22it/s][A

nll mean: 163.10220336914062 	 kl mean: 0.9648629426956177 	 loss mean: 164.0670623779297
nll mean: 163.27191162109375 	 kl mean: 0.9648629426956177 	 loss mean: 164.2367706298828
nll mean: 162.96340942382812 	 kl mean: 0.9648629426956177 	 loss mean: 163.9282684326172


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.22it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 13.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.84it/s][A

nll mean: 162.9671630859375 	 kl mean: 0.9648629426956177 	 loss mean: 163.93202209472656
nll mean: 163.1263885498047 	 kl mean: 0.9648629426956177 	 loss mean: 164.09124755859375
nll mean: 163.00885009765625 	 kl mean: 0.9648629426956177 	 loss mean: 163.97369384765625


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.47it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.84it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A

nll mean: 162.85386657714844 	 kl mean: 0.9648629426956177 	 loss mean: 163.8187255859375
nll mean: 162.9937744140625 	 kl mean: 0.9648629426956177 	 loss mean: 163.95863342285156
nll mean: 163.03013610839844 	 kl mean: 0.9648629426956177 	 loss mean: 163.9949951171875


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.59it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               


nll mean: 163.02561950683594 	 kl mean: 0.9648629426956177 	 loss mean: 163.99049377441406
nll mean: 123.0644760131836 	 kl mean: 1.1146986484527588 	 loss mean: 124.1791763305664


 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 10.11it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.12it/s][A

nll mean: 123.11924743652344 	 kl mean: 1.1146986484527588 	 loss mean: 124.23394775390625
nll mean: 123.32815551757812 	 kl mean: 1.1146986484527588 	 loss mean: 124.44286346435547
nll mean: 123.63296508789062 	 kl mean: 1.1146986484527588 	 loss mean: 124.74767303466797


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 10.12it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.15it/s][A

nll mean: 123.23016357421875 	 kl mean: 1.1146986484527588 	 loss mean: 124.3448715209961
nll mean: 123.308837890625 	 kl mean: 1.1146986484527588 	 loss mean: 124.42353057861328
nll mean: 123.41667938232422 	 kl mean: 1.1146986484527588 	 loss mean: 124.53137969970703


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.15it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.16it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.17it/s][A

nll mean: 123.71443176269531 	 kl mean: 1.1146986484527588 	 loss mean: 124.82913208007812
nll mean: 123.287841796875 	 kl mean: 1.1146986484527588 	 loss mean: 124.40254211425781
nll mean: 123.43106079101562 	 kl mean: 1.1146986484527588 	 loss mean: 124.54576873779297


100%|██████████| 10/10 [00:00<00:00, 10.16it/s]
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 32.72it/s][A

nll mean: 112.88006591796875 	 kl mean: 0.7758998870849609 	 loss mean: 113.65596008300781
nll mean: 112.55424499511719 	 kl mean: 0.7758998870849609 	 loss mean: 113.33015441894531
nll mean: 112.61412048339844 	 kl mean: 0.7758998870849609 	 loss mean: 113.39002227783203
nll mean: 112.98602294921875 	 kl mean: 0.7758998870849609 	 loss mean: 113.76191711425781
nll mean: 112.63652038574219 	 kl mean: 0.7758998870849609 	 loss mean: 113.41242218017578
nll mean: 112.79309844970703 	 kl mean: 0.7758998870849609 	 loss mean: 113.56900024414062
nll mean: 112.68299102783203 	 kl mean: 0.7758998870849609 	 loss mean: 113.45889282226562


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 32.72it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 32.34it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.7288818359375 	 kl mean: 0.7758998870849609 	 loss mean: 113.50477600097656
nll mean: 112.44351196289062 	 kl mean: 0.7758998870849609 	 loss mean: 113.21940612792969
nll mean: 112.56349182128906 	 kl mean: 0.7758998870849609 	 loss mean: 113.33938598632812
nll mean: 163.2419891357422 	 kl mean: 0.8547736406326294 	 loss mean: 164.09677124023438


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.63it/s][A

nll mean: 163.3383331298828 	 kl mean: 0.8547736406326294 	 loss mean: 164.19309997558594
nll mean: 163.22723388671875 	 kl mean: 0.8547736406326294 	 loss mean: 164.08200073242188
nll mean: 163.10562133789062 	 kl mean: 0.8547736406326294 	 loss mean: 163.9604034423828


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.63it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A

nll mean: 163.16915893554688 	 kl mean: 0.8547736406326294 	 loss mean: 164.02394104003906
nll mean: 163.1151580810547 	 kl mean: 0.8547736406326294 	 loss mean: 163.96990966796875
nll mean: 163.09747314453125 	 kl mean: 0.8547736406326294 	 loss mean: 163.95223999023438


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.68it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 163.17767333984375 	 kl mean: 0.8547736406326294 	 loss mean: 164.03244018554688
nll mean: 163.38150024414062 	 kl mean: 0.8547736406326294 	 loss mean: 164.2362823486328
nll mean: 163.27574157714844 	 kl mean: 0.8547736406326294 	 loss mean: 164.1304931640625
nll mean: 127.17728424072266 	 kl mean: 1.0423630475997925 	 loss mean: 128.2196502685547


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.09it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.01it/s][A

nll mean: 127.26510620117188 	 kl mean: 1.0423630475997925 	 loss mean: 128.30746459960938
nll mean: 127.34884643554688 	 kl mean: 1.0423630475997925 	 loss mean: 128.39120483398438
nll mean: 127.31085205078125 	 kl mean: 1.0423630475997925 	 loss mean: 128.35321044921875
nll mean: 127.27283477783203 	 kl mean: 1.0423630475997925 	 loss mean: 128.31520080566406
nll mean: 127.30455017089844 	 kl mean: 1.0423630475997925 	 loss mean: 128.346923828125


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.01it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.67it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.46482849121094 	 kl mean: 1.0423630475997925 	 loss mean: 128.5072021484375
nll mean: 127.38192749023438 	 kl mean: 1.0423630475997925 	 loss mean: 128.42430114746094
nll mean: 127.34159851074219 	 kl mean: 1.0423630475997925 	 loss mean: 128.3839569091797
nll mean: 127.23072052001953 	 kl mean: 1.0423630475997925 	 loss mean: 128.27308654785156


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.61it/s]

nll mean: 120.2663803100586 	 kl mean: 1.0313160419464111 	 loss mean: 121.29769134521484
nll mean: 120.32610321044922 	 kl mean: 1.0313160419464111 	 loss mean: 121.35742950439453
nll mean: 120.40655517578125 	 kl mean: 1.0313160419464111 	 loss mean: 121.43787384033203
nll mean: 120.06908416748047 	 kl mean: 1.0313160419464111 	 loss mean: 121.10041046142578


[A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.80it/s][A

nll mean: 120.25743865966797 	 kl mean: 1.0313160419464111 	 loss mean: 121.28874969482422
nll mean: 120.2514419555664 	 kl mean: 1.0313160419464111 	 loss mean: 121.28274536132812
nll mean: 120.20805358886719 	 kl mean: 1.0313160419464111 	 loss mean: 121.23937225341797


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.80it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.80it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.75it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.06346130371094 	 kl mean: 1.0313160419464111 	 loss mean: 121.09477233886719
nll mean: 120.10914611816406 	 kl mean: 1.0313160419464111 	 loss mean: 121.14047241210938
nll mean: 120.11964416503906 	 kl mean: 1.0313160419464111 	 loss mean: 121.15095520019531
nll mean: 87.26759338378906 	 kl mean: 1.026954174041748 	 loss mean: 88.29454803466797


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 22.36it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.60it/s][A

nll mean: 87.13811492919922 	 kl mean: 1.026954174041748 	 loss mean: 88.16506958007812
nll mean: 87.33317565917969 	 kl mean: 1.026954174041748 	 loss mean: 88.3601303100586
nll mean: 87.00601959228516 	 kl mean: 1.026954174041748 	 loss mean: 88.03297424316406
nll mean: 87.06692504882812 	 kl mean: 1.026954174041748 	 loss mean: 88.09387969970703
nll mean: 86.94644927978516 	 kl mean: 1.026954174041748 	 loss mean: 87.97340393066406


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.60it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
100%|██████████| 10/10 [00:00<00:00, 22.79it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 86.98173522949219 	 kl mean: 1.026954174041748 	 loss mean: 88.00868225097656
nll mean: 87.0439682006836 	 kl mean: 1.026954174041748 	 loss mean: 88.0709228515625
nll mean: 87.01536560058594 	 kl mean: 1.026954174041748 	 loss mean: 88.04232025146484
nll mean: 87.18359375 	 kl mean: 1.026954174041748 	 loss mean: 88.21055603027344
nll mean: 113.3564453125 	 kl mean: 0.8794400691986084 	 loss mean: 114.23588562011719


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
 30%|███       | 3/10 [00:00<00:00, 21.47it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.50it/s][A

nll mean: 113.56963348388672 	 kl mean: 0.8794400691986084 	 loss mean: 114.44906616210938
nll mean: 113.76937103271484 	 kl mean: 0.8794400691986084 	 loss mean: 114.64881134033203
nll mean: 113.68975830078125 	 kl mean: 0.8794400691986084 	 loss mean: 114.56919860839844
nll mean: 113.45988464355469 	 kl mean: 0.8794400691986084 	 loss mean: 114.33932495117188
nll mean: 113.66324615478516 	 kl mean: 0.8794400691986084 	 loss mean: 114.54267883300781


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.50it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
100%|██████████| 10/10 [00:00<00:00, 21.50it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 113.44506072998047 	 kl mean: 0.8794400691986084 	 loss mean: 114.32449340820312
nll mean: 113.44194793701172 	 kl mean: 0.8794400691986084 	 loss mean: 114.3213882446289
nll mean: 113.53654479980469 	 kl mean: 0.8794400691986084 	 loss mean: 114.41598510742188
nll mean: 113.53385925292969 	 kl mean: 0.8794400691986084 	 loss mean: 114.41329956054688


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A

nll mean: 127.64478302001953 	 kl mean: 0.9559108018875122 	 loss mean: 128.6007080078125
nll mean: 127.6726303100586 	 kl mean: 0.9559108018875122 	 loss mean: 128.6285400390625
nll mean: 127.70294189453125 	 kl mean: 0.9559108018875122 	 loss mean: 128.65887451171875


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 40%|████      | 4/10 [00:00<00:00, 12.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A

nll mean: 127.77566528320312 	 kl mean: 0.9559108018875122 	 loss mean: 128.7315673828125
nll mean: 127.63615417480469 	 kl mean: 0.9559108018875122 	 loss mean: 128.59207153320312
nll mean: 127.84223937988281 	 kl mean: 0.9559108018875122 	 loss mean: 128.7981414794922


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.58it/s][A

nll mean: 127.77626037597656 	 kl mean: 0.9559108018875122 	 loss mean: 128.732177734375
nll mean: 127.60188293457031 	 kl mean: 0.9559108018875122 	 loss mean: 128.55780029296875
nll mean: 127.66304016113281 	 kl mean: 0.9559108018875122 	 loss mean: 128.6189422607422


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.85it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.57it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.69063568115234 	 kl mean: 0.9559108018875122 	 loss mean: 128.64654541015625
nll mean: 67.48973083496094 	 kl mean: 1.5847899913787842 	 loss mean: 69.07452392578125


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 20%|██        | 2/10 [00:00<00:00, 10.08it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.96it/s][A

nll mean: 67.42036437988281 	 kl mean: 1.5847899913787842 	 loss mean: 69.00515747070312
nll mean: 67.61629486083984 	 kl mean: 1.5847899913787842 	 loss mean: 69.20108795166016


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 30%|███       | 3/10 [00:00<00:00,  9.96it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.02it/s][A

nll mean: 67.50235748291016 	 kl mean: 1.5847899913787842 	 loss mean: 69.08714294433594
nll mean: 67.51798248291016 	 kl mean: 1.5847899913787842 	 loss mean: 69.10277557373047
nll mean: 67.58163452148438 	 kl mean: 1.5847899913787842 	 loss mean: 69.16642761230469


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.02it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.10it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.11it/s][A

nll mean: 67.71617889404297 	 kl mean: 1.5847899913787842 	 loss mean: 69.30097198486328
nll mean: 67.44609069824219 	 kl mean: 1.5847899913787842 	 loss mean: 69.03087615966797
nll mean: 67.37361145019531 	 kl mean: 1.5847899913787842 	 loss mean: 68.95840454101562


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.62it/s]
100%|██████████| 10/10 [00:00<00:00, 10.11it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.79it/s][A

nll mean: 67.20309448242188 	 kl mean: 1.5847899913787842 	 loss mean: 68.78789520263672
nll mean: 109.5618896484375 	 kl mean: 1.2663366794586182 	 loss mean: 110.82821655273438
nll mean: 109.5206298828125 	 kl mean: 1.2663366794586182 	 loss mean: 110.7869644165039


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 12.79it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 12.87it/s][A

nll mean: 109.4752426147461 	 kl mean: 1.2663366794586182 	 loss mean: 110.7415771484375
nll mean: 109.26937866210938 	 kl mean: 1.2663366794586182 	 loss mean: 110.53572082519531
nll mean: 109.3821792602539 	 kl mean: 1.2663366794586182 	 loss mean: 110.64851379394531


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 12.87it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.86it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.79it/s][A

nll mean: 109.40187072753906 	 kl mean: 1.2663366794586182 	 loss mean: 110.66820526123047
nll mean: 109.29484558105469 	 kl mean: 1.2663366794586182 	 loss mean: 110.56117248535156
nll mean: 109.35189819335938 	 kl mean: 1.2663366794586182 	 loss mean: 110.61823272705078


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.79it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.82it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.28206634521484 	 kl mean: 1.2663366794586182 	 loss mean: 110.54840087890625
nll mean: 109.36973571777344 	 kl mean: 1.2663366794586182 	 loss mean: 110.63607788085938
nll mean: 144.43064880371094 	 kl mean: 1.0246469974517822 	 loss mean: 145.45529174804688


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 20%|██        | 2/10 [00:00<00:00, 10.26it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]


nll mean: 144.4135284423828 	 kl mean: 1.0246469974517822 	 loss mean: 145.43817138671875
nll mean: 144.31973266601562 	 kl mean: 1.0246469974517822 	 loss mean: 145.34439086914062
nll mean: 144.29769897460938 	 kl mean: 1.0246469974517822 	 loss mean: 145.3223419189453


                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 10.17it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
                                               [A


nll mean: 144.48460388183594 	 kl mean: 1.0246469974517822 	 loss mean: 145.50924682617188
nll mean: 144.3668212890625 	 kl mean: 1.0246469974517822 	 loss mean: 145.39146423339844


 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.17it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.10it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.06it/s][A

nll mean: 144.37838745117188 	 kl mean: 1.0246469974517822 	 loss mean: 145.4030303955078
nll mean: 144.30117797851562 	 kl mean: 1.0246469974517822 	 loss mean: 145.3258056640625
nll mean: 144.42230224609375 	 kl mean: 1.0246469974517822 	 loss mean: 145.44696044921875


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.06it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.07it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.03it/s][A

nll mean: 144.47784423828125 	 kl mean: 1.0246469974517822 	 loss mean: 145.50247192382812
nll mean: 68.07691955566406 	 kl mean: 1.3197314739227295 	 loss mean: 69.39665222167969
nll mean: 68.29690551757812 	 kl mean: 1.3197314739227295 	 loss mean: 69.61663818359375
nll mean: 68.1906509399414 	 kl mean: 1.3197314739227295 	 loss mean: 69.51038360595703
nll mean: 68.21160888671875 	 kl mean: 1.3197314739227295 	 loss mean: 69.53134155273438
nll mean: 67.99512481689453 	 kl mean: 1.3197314739227295 	 loss mean: 69.31486511230469


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.03it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.76it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
100%|██████████| 10/10 [00:00<00:00, 25.55it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 68.19103240966797 	 kl mean: 1.3197314739227295 	 loss mean: 69.51075744628906
nll mean: 68.02919006347656 	 kl mean: 1.3197314739227295 	 loss mean: 69.34892272949219
nll mean: 68.17261505126953 	 kl mean: 1.3197314739227295 	 loss mean: 69.49234771728516
nll mean: 68.19554138183594 	 kl mean: 1.3197314739227295 	 loss mean: 69.51527404785156
nll mean: 68.20379638671875 	 kl mean: 1.3197314739227295 	 loss mean: 69.52352905273438


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 22.14it/s][A

nll mean: 124.46500396728516 	 kl mean: 0.9289427399635315 	 loss mean: 125.3939437866211
nll mean: 124.2105484008789 	 kl mean: 0.9289427399635315 	 loss mean: 125.13948822021484
nll mean: 124.38056945800781 	 kl mean: 0.9289427399635315 	 loss mean: 125.30950927734375
nll mean: 124.15945434570312 	 kl mean: 0.9289427399635315 	 loss mean: 125.08839416503906
nll mean: 124.34254455566406 	 kl mean: 0.9289427399635315 	 loss mean: 125.271484375


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 22.14it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.02it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
100%|██████████| 10/10 [00:00<00:00, 21.75it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.18632507324219 	 kl mean: 0.9289427399635315 	 loss mean: 125.11527252197266
nll mean: 124.50151062011719 	 kl mean: 0.9289427399635315 	 loss mean: 125.43045043945312
nll mean: 124.47733306884766 	 kl mean: 0.9289427399635315 	 loss mean: 125.40628051757812
nll mean: 124.28314208984375 	 kl mean: 0.9289427399635315 	 loss mean: 125.21208953857422
nll mean: 124.33551788330078 	 kl mean: 0.9289427399635315 	 loss mean: 125.26445770263672


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 12.59it/s][A

nll mean: 126.92115783691406 	 kl mean: 1.1086875200271606 	 loss mean: 128.02984619140625
nll mean: 126.81864929199219 	 kl mean: 1.1086875200271606 	 loss mean: 127.92733001708984
nll mean: 126.76922607421875 	 kl mean: 1.1086875200271606 	 loss mean: 127.87791442871094


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 12.59it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.63it/s][A

nll mean: 126.97354125976562 	 kl mean: 1.1086875200271606 	 loss mean: 128.0822296142578
nll mean: 126.59569549560547 	 kl mean: 1.1086875200271606 	 loss mean: 127.70437622070312
nll mean: 126.81151580810547 	 kl mean: 1.1086875200271606 	 loss mean: 127.92019653320312


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.63it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A

nll mean: 126.66692352294922 	 kl mean: 1.1086875200271606 	 loss mean: 127.7756118774414
nll mean: 126.63148498535156 	 kl mean: 1.1086875200271606 	 loss mean: 127.74017333984375
nll mean: 126.84367370605469 	 kl mean: 1.1086875200271606 	 loss mean: 127.95236206054688


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.68it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A

nll mean: 126.84210968017578 	 kl mean: 1.1086875200271606 	 loss mean: 127.95079040527344
nll mean: 118.72059631347656 	 kl mean: 1.0983141660690308 	 loss mean: 119.81891632080078
nll mean: 118.70487976074219 	 kl mean: 1.0983141660690308 	 loss mean: 119.8031997680664


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A

nll mean: 118.69056701660156 	 kl mean: 1.0983141660690308 	 loss mean: 119.78887939453125
nll mean: 118.58222961425781 	 kl mean: 1.0983141660690308 	 loss mean: 119.6805419921875
nll mean: 118.6798095703125 	 kl mean: 1.0983141660690308 	 loss mean: 119.77812194824219


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.72it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A

nll mean: 118.83396911621094 	 kl mean: 1.0983141660690308 	 loss mean: 119.93228149414062
nll mean: 119.00794982910156 	 kl mean: 1.0983141660690308 	 loss mean: 120.10626220703125
nll mean: 118.75723266601562 	 kl mean: 1.0983141660690308 	 loss mean: 119.85554504394531


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.71it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.91252899169922 	 kl mean: 1.0983141660690308 	 loss mean: 120.01083374023438
nll mean: 118.79090881347656 	 kl mean: 1.0983141660690308 	 loss mean: 119.88922119140625
nll mean: 117.94200897216797 	 kl mean: 1.026389479637146 	 loss mean: 118.9684066772461
nll mean: 117.87445068359375 	 kl mean: 1.026389479637146 	 loss mean: 118.90083312988281


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 23.11it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A

nll mean: 117.93875122070312 	 kl mean: 1.026389479637146 	 loss mean: 118.96514129638672
nll mean: 117.98503875732422 	 kl mean: 1.026389479637146 	 loss mean: 119.01142120361328
nll mean: 117.9073715209961 	 kl mean: 1.026389479637146 	 loss mean: 118.93376159667969
nll mean: 118.00385284423828 	 kl mean: 1.026389479637146 	 loss mean: 119.03024291992188
nll mean: 117.83841705322266 	 kl mean: 1.026389479637146 	 loss mean: 118.86480712890625


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 21.89it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.6640625 	 kl mean: 1.026389479637146 	 loss mean: 118.69046020507812
nll mean: 117.86001586914062 	 kl mean: 1.026389479637146 	 loss mean: 118.88639831542969
nll mean: 117.66603088378906 	 kl mean: 1.026389479637146 	 loss mean: 118.69242858886719
nll mean: 90.63294982910156 	 kl mean: 1.5327614545822144 	 loss mean: 92.16571044921875
nll mean: 90.46187591552734 	 kl mean: 1.5327614545822144 	 loss mean: 91.99464416503906
nll mean: 90.1387939453125 	 kl mean: 1.5327614545822144 	 loss mean: 91.67156219482422


                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 30.93it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 30.76it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 90.26561737060547 	 kl mean: 1.5327614545822144 	 loss mean: 91.79839324951172
nll mean: 90.23519134521484 	 kl mean: 1.5327614545822144 	 loss mean: 91.76795959472656
nll mean: 90.42448425292969 	 kl mean: 1.5327614545822144 	 loss mean: 91.95723724365234
nll mean: 90.31282043457031 	 kl mean: 1.5327614545822144 	 loss mean: 91.8455810546875
nll mean: 90.1052474975586 	 kl mean: 1.5327614545822144 	 loss mean: 91.63802337646484
nll mean: 90.15972137451172 	 kl mean: 1.5327614545822144 	 loss mean: 91.69248962402344
nll mean: 90.40988159179688 	 kl mean: 1.5327614545822144 	 loss mean: 91.9426498413086
Approximate NLL:
tensor(127.2960, device='cuda:0')
Approximate KL:
tensor(1.0724, device='cuda:0')
Testing took 0:00:25.163200


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.77it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].77it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].77it/s][A

nll mean: 115.79920959472656 	 kl mean: 1.4100086688995361 	 loss mean: 117.209228515625
nll mean: 115.82383728027344 	 kl mean: 1.4100086688995361 	 loss mean: 117.23384857177734
nll mean: 115.93387603759766 	 kl mean: 1.4100086688995361 	 loss mean: 117.34388732910156
nll mean: 115.85189819335938 	 kl mean: 1.4100086688995361 	 loss mean: 117.26190948486328
nll mean: 115.90240478515625 	 kl mean: 1.4100086688995361 	 loss mean: 117.31240844726562



                                              
  0%|          | 0/38 [00:00<?, ?it/s].77it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.34it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].34it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].34it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.16it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.90it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 115.81146240234375 	 kl mean: 1.4100086688995361 	 loss mean: 117.22146606445312
nll mean: 115.97193908691406 	 kl mean: 1.4100086688995361 	 loss mean: 117.38194274902344
nll mean: 116.00181579589844 	 kl mean: 1.4100086688995361 	 loss mean: 117.41181945800781
nll mean: 115.5978012084961 	 kl mean: 1.4100086688995361 	 loss mean: 117.0078125
nll mean: 115.92213439941406 	 kl mean: 1.4100086688995361 	 loss mean: 117.33214569091797


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 20%|██        | 2/10 [00:00<00:00, 14.09it/s][A

nll mean: 131.00289916992188 	 kl mean: 1.564008116722107 	 loss mean: 132.56690979003906
nll mean: 131.28858947753906 	 kl mean: 1.564008116722107 	 loss mean: 132.85260009765625
nll mean: 131.4696807861328 	 kl mean: 1.564008116722107 	 loss mean: 133.03369140625


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 20%|██        | 2/10 [00:00<00:00, 14.09it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 40%|████      | 4/10 [00:00<00:00, 14.03it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.06it/s][A

nll mean: 131.25579833984375 	 kl mean: 1.564008116722107 	 loss mean: 132.81980895996094
nll mean: 131.4293212890625 	 kl mean: 1.564008116722107 	 loss mean: 132.99334716796875
nll mean: 130.96542358398438 	 kl mean: 1.564008116722107 	 loss mean: 132.52943420410156


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.06it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.11it/s][A

nll mean: 131.22134399414062 	 kl mean: 1.564008116722107 	 loss mean: 132.7853546142578
nll mean: 131.39581298828125 	 kl mean: 1.564008116722107 	 loss mean: 132.95980834960938
nll mean: 131.09811401367188 	 kl mean: 1.564008116722107 	 loss mean: 132.662109375


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.03it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 25.03it/s][A

nll mean: 131.22079467773438 	 kl mean: 1.564008116722107 	 loss mean: 132.78482055664062
nll mean: 103.72297668457031 	 kl mean: 1.2921795845031738 	 loss mean: 105.01515197753906
nll mean: 103.70323181152344 	 kl mean: 1.2921795845031738 	 loss mean: 104.99541473388672
nll mean: 103.82240295410156 	 kl mean: 1.2921795845031738 	 loss mean: 105.11458587646484
nll mean: 103.96031188964844 	 kl mean: 1.2921795845031738 	 loss mean: 105.25248718261719


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 25.03it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.84it/s][A
                                              [A

nll mean: 103.90314483642578 	 kl mean: 1.2921795845031738 	 loss mean: 105.19532775878906
nll mean: 103.58872985839844 	 kl mean: 1.2921795845031738 	 loss mean: 104.88090515136719
nll mean: 103.8109359741211 	 kl mean: 1.2921795845031738 	 loss mean: 105.10311889648438
nll mean: 103.76966857910156 	 kl mean: 1.2921795845031738 	 loss mean: 105.06185150146484
nll mean: 103.97769165039062 	 kl mean: 1.2921795845031738 	 loss mean: 105.26986694335938



  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 24.75it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A

nll mean: 103.81843566894531 	 kl mean: 1.2921795845031738 	 loss mean: 105.11061096191406
nll mean: 143.2554473876953 	 kl mean: 1.4803009033203125 	 loss mean: 144.73574829101562
nll mean: 143.4201202392578 	 kl mean: 1.4803009033203125 	 loss mean: 144.9004364013672



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.85it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A

nll mean: 143.4205322265625 	 kl mean: 1.4803009033203125 	 loss mean: 144.90084838867188
nll mean: 143.27658081054688 	 kl mean: 1.4803009033203125 	 loss mean: 144.75689697265625
nll mean: 143.39785766601562 	 kl mean: 1.4803009033203125 	 loss mean: 144.878173828125



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.83it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.87it/s][A

nll mean: 143.49945068359375 	 kl mean: 1.4803009033203125 	 loss mean: 144.979736328125
nll mean: 143.37855529785156 	 kl mean: 1.4803009033203125 	 loss mean: 144.85885620117188
nll mean: 143.61822509765625 	 kl mean: 1.4803009033203125 	 loss mean: 145.09854125976562



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.87it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]

nll mean: 143.5040283203125 	 kl mean: 1.4803009033203125 	 loss mean: 144.9843292236328
nll mean: 143.49368286132812 	 kl mean: 1.4803009033203125 	 loss mean: 144.97398376464844
nll mean: 131.19789123535156 	 kl mean: 1.450860857963562 	 loss mean: 132.64877319335938



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 13.85it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.93it/s][A

nll mean: 131.22079467773438 	 kl mean: 1.450860857963562 	 loss mean: 132.67164611816406
nll mean: 131.21688842773438 	 kl mean: 1.450860857963562 	 loss mean: 132.66775512695312
nll mean: 131.283447265625 	 kl mean: 1.450860857963562 	 loss mean: 132.73431396484375



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.04it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A

nll mean: 131.48135375976562 	 kl mean: 1.450860857963562 	 loss mean: 132.9322052001953
nll mean: 131.47618103027344 	 kl mean: 1.450860857963562 	 loss mean: 132.9270477294922
nll mean: 131.2625274658203 	 kl mean: 1.450860857963562 	 loss mean: 132.71339416503906



                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.20it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.20it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 131.05429077148438 	 kl mean: 1.450860857963562 	 loss mean: 132.50514221191406
nll mean: 131.35186767578125 	 kl mean: 1.450860857963562 	 loss mean: 132.802734375
nll mean: 131.1627655029297 	 kl mean: 1.450860857963562 	 loss mean: 132.61361694335938



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.03it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A

nll mean: 128.19407653808594 	 kl mean: 1.4234312772750854 	 loss mean: 129.6175079345703
nll mean: 128.2523651123047 	 kl mean: 1.4234312772750854 	 loss mean: 129.67581176757812
nll mean: 128.27349853515625 	 kl mean: 1.4234312772750854 	 loss mean: 129.69691467285156



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.05it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.14it/s][A

nll mean: 128.3668212890625 	 kl mean: 1.4234312772750854 	 loss mean: 129.79025268554688
nll mean: 128.4258270263672 	 kl mean: 1.4234312772750854 	 loss mean: 129.8492431640625
nll mean: 128.54885864257812 	 kl mean: 1.4234312772750854 	 loss mean: 129.9722900390625



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.00it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A

nll mean: 128.26629638671875 	 kl mean: 1.4234312772750854 	 loss mean: 129.68972778320312
nll mean: 128.30447387695312 	 kl mean: 1.4234312772750854 	 loss mean: 129.7279052734375
nll mean: 128.29058837890625 	 kl mean: 1.4234312772750854 	 loss mean: 129.71401977539062



                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.08it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.68it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A


nll mean: 128.42335510253906 	 kl mean: 1.4234312772750854 	 loss mean: 129.84677124023438
nll mean: 139.2536163330078 	 kl mean: 1.2542568445205688 	 loss mean: 140.50787353515625
nll mean: 139.28147888183594 	 kl mean: 1.2542568445205688 	 loss mean: 140.53573608398438
nll mean: 138.90310668945312 	 kl mean: 1.2542568445205688 	 loss mean: 140.15736389160156
nll mean: 139.04579162597656 	 kl mean: 1.2542568445205688 	 loss mean: 140.300048828125


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.08it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.10it/s][A


nll mean: 139.1688995361328 	 kl mean: 1.2542568445205688 	 loss mean: 140.42315673828125
nll mean: 138.91836547851562 	 kl mean: 1.2542568445205688 	 loss mean: 140.17263793945312
nll mean: 139.3013153076172 	 kl mean: 1.2542568445205688 	 loss mean: 140.55557250976562
nll mean: 139.00738525390625 	 kl mean: 1.2542568445205688 	 loss mean: 140.2616424560547
nll mean: 139.20814514160156 	 kl mean: 1.2542568445205688 	 loss mean: 140.46240234375


                                              
100%|██████████| 10/10 [00:00<00:00, 24.84it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]

nll mean: 139.116943359375 	 kl mean: 1.2542568445205688 	 loss mean: 140.3712158203125
nll mean: 111.3265380859375 	 kl mean: 1.4701457023620605 	 loss mean: 112.79668426513672
nll mean: 111.31605529785156 	 kl mean: 1.4701457023620605 	 loss mean: 112.78620147705078
nll mean: 111.28372955322266 	 kl mean: 1.4701457023620605 	 loss mean: 112.75387573242188
nll mean: 111.44923400878906 	 kl mean: 1.4701457023620605 	 loss mean: 112.91937255859375
nll mean: 111.51046752929688 	 kl mean: 1.4701457023620605 	 loss mean: 112.98060607910156



                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.38it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.31it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 25.07it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.23301696777344 	 kl mean: 1.4701457023620605 	 loss mean: 112.70315551757812
nll mean: 111.17024993896484 	 kl mean: 1.4701457023620605 	 loss mean: 112.64039611816406
nll mean: 111.54923248291016 	 kl mean: 1.4701457023620605 	 loss mean: 113.01937866210938
nll mean: 111.2882080078125 	 kl mean: 1.4701457023620605 	 loss mean: 112.75836181640625
nll mean: 111.42169189453125 	 kl mean: 1.4701457023620605 	 loss mean: 112.89183044433594


                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
 20%|██        | 2/10 [00:00<00:00, 15.27it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.39it/s][A

nll mean: 136.69580078125 	 kl mean: 1.548292636871338 	 loss mean: 138.2440948486328
nll mean: 136.71414184570312 	 kl mean: 1.548292636871338 	 loss mean: 138.26243591308594
nll mean: 136.84617614746094 	 kl mean: 1.548292636871338 	 loss mean: 138.39447021484375
nll mean: 136.7747802734375 	 kl mean: 1.548292636871338 	 loss mean: 138.3230743408203


                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 40%|████      | 4/10 [00:00<00:00, 15.39it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
[A                                           

nll mean: 136.68161010742188 	 kl mean: 1.548292636871338 	 loss mean: 138.2299041748047
nll mean: 137.04229736328125 	 kl mean: 1.548292636871338 	 loss mean: 138.59060668945312
nll mean: 137.09890747070312 	 kl mean: 1.548292636871338 	 loss mean: 138.64718627929688


 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.09it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.17it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]

nll mean: 136.9668731689453 	 kl mean: 1.548292636871338 	 loss mean: 138.51515197753906
nll mean: 136.908203125 	 kl mean: 1.548292636871338 	 loss mean: 138.45648193359375
nll mean: 136.84518432617188 	 kl mean: 1.548292636871338 	 loss mean: 138.3934783935547
nll mean: 136.64466857910156 	 kl mean: 1.3006585836410522 	 loss mean: 137.94534301757812
nll mean: 136.69802856445312 	 kl mean: 1.3006585836410522 	 loss mean: 137.99868774414062



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.49it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A

nll mean: 136.58876037597656 	 kl mean: 1.3006585836410522 	 loss mean: 137.88941955566406
nll mean: 136.70794677734375 	 kl mean: 1.3006585836410522 	 loss mean: 138.00860595703125
nll mean: 136.8440704345703 	 kl mean: 1.3006585836410522 	 loss mean: 138.14474487304688
nll mean: 136.5810546875 	 kl mean: 1.3006585836410522 	 loss mean: 137.88172912597656
nll mean: 136.57542419433594 	 kl mean: 1.3006585836410522 	 loss mean: 137.8760986328125



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.37it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.22it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]

nll mean: 136.57122802734375 	 kl mean: 1.3006585836410522 	 loss mean: 137.87188720703125
nll mean: 136.73086547851562 	 kl mean: 1.3006585836410522 	 loss mean: 138.03152465820312
nll mean: 136.74908447265625 	 kl mean: 1.3006585836410522 	 loss mean: 138.04974365234375
nll mean: 123.90292358398438 	 kl mean: 1.5910942554473877 	 loss mean: 125.4940185546875
nll mean: 123.8602294921875 	 kl mean: 1.5910942554473877 	 loss mean: 125.45132446289062



                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
 30%|███       | 3/10 [00:00<00:00, 25.32it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.25it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s][A
                                               
 60%|██████    | 6/10 [00:00<00:00, 25.25it/s]

nll mean: 123.75333404541016 	 kl mean: 1.5910942554473877 	 loss mean: 125.34442901611328
nll mean: 123.5280990600586 	 kl mean: 1.5910942554473877 	 loss mean: 125.11919403076172
nll mean: 123.71334838867188 	 kl mean: 1.5910942554473877 	 loss mean: 125.304443359375
nll mean: 123.64707946777344 	 kl mean: 1.5910942554473877 	 loss mean: 125.23817443847656
nll mean: 123.56961059570312 	 kl mean: 1.5910942554473877 	 loss mean: 125.16070556640625
nll mean: 123.7048110961914 	 kl mean: 1.5910942554473877 	 loss mean: 125.29590606689453


 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.15it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.02it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 21.60it/s][A

nll mean: 123.8656997680664 	 kl mean: 1.5910942554473877 	 loss mean: 125.45679473876953
nll mean: 123.69744110107422 	 kl mean: 1.5910942554473877 	 loss mean: 125.28853607177734
nll mean: 145.52835083007812 	 kl mean: 1.4197120666503906 	 loss mean: 146.9480743408203
nll mean: 145.7266845703125 	 kl mean: 1.4197120666503906 	 loss mean: 147.14639282226562
nll mean: 145.48052978515625 	 kl mean: 1.4197120666503906 	 loss mean: 146.90023803710938


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 21.60it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.52it/s][A

nll mean: 145.58493041992188 	 kl mean: 1.4197120666503906 	 loss mean: 147.004638671875
nll mean: 145.7826690673828 	 kl mean: 1.4197120666503906 	 loss mean: 147.20237731933594
nll mean: 145.59039306640625 	 kl mean: 1.4197120666503906 	 loss mean: 147.01010131835938
nll mean: 145.8769989013672 	 kl mean: 1.4197120666503906 	 loss mean: 147.2967071533203
nll mean: 145.50515747070312 	 kl mean: 1.4197120666503906 	 loss mean: 146.92486572265625


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.52it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 21.25it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]

nll mean: 145.61004638671875 	 kl mean: 1.4197120666503906 	 loss mean: 147.02976989746094
nll mean: 145.5985107421875 	 kl mean: 1.4197120666503906 	 loss mean: 147.01821899414062
nll mean: 124.48846435546875 	 kl mean: 1.7944728136062622 	 loss mean: 126.2829360961914



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.64it/s][A

nll mean: 124.68221282958984 	 kl mean: 1.7944728136062622 	 loss mean: 126.4766845703125
nll mean: 124.54199981689453 	 kl mean: 1.7944728136062622 	 loss mean: 126.33647155761719
nll mean: 124.69032287597656 	 kl mean: 1.7944728136062622 	 loss mean: 126.48479461669922



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.57it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A

nll mean: 124.5285873413086 	 kl mean: 1.7944728136062622 	 loss mean: 126.32305908203125
nll mean: 124.83270263671875 	 kl mean: 1.7944728136062622 	 loss mean: 126.62718200683594
nll mean: 124.6229476928711 	 kl mean: 1.7944728136062622 	 loss mean: 126.41741943359375



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.55it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.83903503417969 	 kl mean: 1.7944728136062622 	 loss mean: 126.63351440429688
nll mean: 124.75264739990234 	 kl mean: 1.7944728136062622 	 loss mean: 126.547119140625
nll mean: 124.84732055664062 	 kl mean: 1.7944728136062622 	 loss mean: 126.64179992675781


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 10%|█         | 1/10 [00:00<00:00,  9.92it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.87it/s][A

nll mean: 167.87982177734375 	 kl mean: 1.5896048545837402 	 loss mean: 169.46945190429688
nll mean: 167.7960968017578 	 kl mean: 1.5896048545837402 	 loss mean: 169.38571166992188


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00,  9.87it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00,  9.83it/s][A
                                               [A

nll mean: 167.69024658203125 	 kl mean: 1.5896048545837402 	 loss mean: 169.27987670898438
nll mean: 167.58804321289062 	 kl mean: 1.5896048545837402 	 loss mean: 169.17764282226562



 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00,  9.87it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.88it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.85it/s][A

nll mean: 167.6928253173828 	 kl mean: 1.5896048545837402 	 loss mean: 169.28244018554688
nll mean: 167.69998168945312 	 kl mean: 1.5896048545837402 	 loss mean: 169.2895965576172


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.85it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.83it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.91it/s]

nll mean: 167.77586364746094 	 kl mean: 1.5896048545837402 	 loss mean: 169.365478515625
nll mean: 167.93788146972656 	 kl mean: 1.5896048545837402 	 loss mean: 169.52749633789062
nll mean: 167.87271118164062 	 kl mean: 1.5896048545837402 	 loss mean: 169.46231079101562


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.91it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.88it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.24it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 167.43838500976562 	 kl mean: 1.5896048545837402 	 loss mean: 169.02798461914062
nll mean: 140.55931091308594 	 kl mean: 1.3634955883026123 	 loss mean: 141.9228057861328
nll mean: 140.73980712890625 	 kl mean: 1.3634955883026123 	 loss mean: 142.10330200195312
nll mean: 140.95315551757812 	 kl mean: 1.3634955883026123 	 loss mean: 142.316650390625



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.13it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.04it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 140.6117706298828 	 kl mean: 1.3634955883026123 	 loss mean: 141.9752655029297
nll mean: 140.77532958984375 	 kl mean: 1.3634955883026123 	 loss mean: 142.13882446289062
nll mean: 140.71490478515625 	 kl mean: 1.3634955883026123 	 loss mean: 142.07839965820312
nll mean: 140.8931884765625 	 kl mean: 1.3634955883026123 	 loss mean: 142.25668334960938



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 17.99it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.94it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 140.918212890625 	 kl mean: 1.3634955883026123 	 loss mean: 142.2816925048828
nll mean: 140.79397583007812 	 kl mean: 1.3634955883026123 	 loss mean: 142.157470703125
nll mean: 140.8424835205078 	 kl mean: 1.3634955883026123 	 loss mean: 142.2059783935547



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A

nll mean: 147.63922119140625 	 kl mean: 1.6314830780029297 	 loss mean: 149.2707061767578
nll mean: 147.5389404296875 	 kl mean: 1.6314830780029297 	 loss mean: 149.17042541503906
nll mean: 147.5823974609375 	 kl mean: 1.6314830780029297 	 loss mean: 149.2138671875



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.76it/s][A

nll mean: 147.77374267578125 	 kl mean: 1.6314830780029297 	 loss mean: 149.4052276611328
nll mean: 147.7865447998047 	 kl mean: 1.6314830780029297 	 loss mean: 149.41802978515625
nll mean: 147.55685424804688 	 kl mean: 1.6314830780029297 	 loss mean: 149.18832397460938



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A

nll mean: 148.00650024414062 	 kl mean: 1.6314830780029297 	 loss mean: 149.63800048828125
nll mean: 147.57638549804688 	 kl mean: 1.6314830780029297 	 loss mean: 149.2078857421875
nll mean: 147.78271484375 	 kl mean: 1.6314830780029297 	 loss mean: 149.41419982910156



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.72it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 25.06it/s][A

nll mean: 147.617431640625 	 kl mean: 1.6314830780029297 	 loss mean: 149.24891662597656
nll mean: 149.32247924804688 	 kl mean: 1.3673171997070312 	 loss mean: 150.68978881835938
nll mean: 149.4100799560547 	 kl mean: 1.3673171997070312 	 loss mean: 150.77740478515625
nll mean: 149.50491333007812 	 kl mean: 1.3673171997070312 	 loss mean: 150.8722381591797
nll mean: 149.3131103515625 	 kl mean: 1.3673171997070312 	 loss mean: 150.68040466308594


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 25.06it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.89it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.86it/s][A

nll mean: 149.674560546875 	 kl mean: 1.3673171997070312 	 loss mean: 151.0418701171875
nll mean: 149.35838317871094 	 kl mean: 1.3673171997070312 	 loss mean: 150.7257080078125
nll mean: 149.29913330078125 	 kl mean: 1.3673171997070312 	 loss mean: 150.66644287109375
nll mean: 149.3048858642578 	 kl mean: 1.3673171997070312 	 loss mean: 150.67221069335938
nll mean: 149.6323699951172 	 kl mean: 1.3673171997070312 	 loss mean: 150.99969482421875


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
100%|██████████| 10/10 [00:00<00:00, 24.76it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.22it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A


nll mean: 149.776123046875 	 kl mean: 1.3673171997070312 	 loss mean: 151.1434326171875
nll mean: 137.92398071289062 	 kl mean: 1.4023226499557495 	 loss mean: 139.3262939453125
nll mean: 138.16659545898438 	 kl mean: 1.4023226499557495 	 loss mean: 139.56890869140625
nll mean: 138.11590576171875 	 kl mean: 1.4023226499557495 	 loss mean: 139.51821899414062
nll mean: 138.2625732421875 	 kl mean: 1.4023226499557495 	 loss mean: 139.66488647460938


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.08it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.00it/s][A


nll mean: 138.20101928710938 	 kl mean: 1.4023226499557495 	 loss mean: 139.6033477783203
nll mean: 137.86380004882812 	 kl mean: 1.4023226499557495 	 loss mean: 139.26614379882812
nll mean: 138.12594604492188 	 kl mean: 1.4023226499557495 	 loss mean: 139.5282745361328
nll mean: 137.98110961914062 	 kl mean: 1.4023226499557495 	 loss mean: 139.38343811035156
nll mean: 138.01971435546875 	 kl mean: 1.4023226499557495 	 loss mean: 139.42202758789062


                                               
100%|██████████| 10/10 [00:00<00:00, 24.82it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.54it/s][A

nll mean: 138.126708984375 	 kl mean: 1.4023226499557495 	 loss mean: 139.529052734375
nll mean: 135.86978149414062 	 kl mean: 1.4835121631622314 	 loss mean: 137.35328674316406
nll mean: 135.86663818359375 	 kl mean: 1.4835121631622314 	 loss mean: 137.3501434326172



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A

nll mean: 135.86610412597656 	 kl mean: 1.4835121631622314 	 loss mean: 137.34962463378906
nll mean: 135.9613800048828 	 kl mean: 1.4835121631622314 	 loss mean: 137.4449005126953
nll mean: 135.86798095703125 	 kl mean: 1.4835121631622314 	 loss mean: 137.3514862060547



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A

nll mean: 136.02764892578125 	 kl mean: 1.4835121631622314 	 loss mean: 137.51116943359375
nll mean: 135.8466796875 	 kl mean: 1.4835121631622314 	 loss mean: 137.33018493652344
nll mean: 135.8258056640625 	 kl mean: 1.4835121631622314 	 loss mean: 137.309326171875



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.66it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]

nll mean: 135.7762908935547 	 kl mean: 1.4835121631622314 	 loss mean: 137.25979614257812
nll mean: 135.68414306640625 	 kl mean: 1.4835121631622314 	 loss mean: 137.16766357421875
nll mean: 154.01113891601562 	 kl mean: 1.4653010368347168 	 loss mean: 155.4764404296875



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.63it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A

nll mean: 154.29147338867188 	 kl mean: 1.4653010368347168 	 loss mean: 155.75677490234375
nll mean: 154.09573364257812 	 kl mean: 1.4653010368347168 	 loss mean: 155.56105041503906
nll mean: 154.1190185546875 	 kl mean: 1.4653010368347168 	 loss mean: 155.58432006835938



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.62it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A

nll mean: 153.89427185058594 	 kl mean: 1.4653010368347168 	 loss mean: 155.3595733642578
nll mean: 154.21316528320312 	 kl mean: 1.4653010368347168 	 loss mean: 155.67845153808594
nll mean: 154.173583984375 	 kl mean: 1.4653010368347168 	 loss mean: 155.63888549804688



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.70it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 154.14910888671875 	 kl mean: 1.4653010368347168 	 loss mean: 155.61441040039062
nll mean: 154.21583557128906 	 kl mean: 1.4653010368347168 	 loss mean: 155.68113708496094
nll mean: 154.31240844726562 	 kl mean: 1.4653010368347168 	 loss mean: 155.7777099609375



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 12.55it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s][A

nll mean: 162.82257080078125 	 kl mean: 1.3488521575927734 	 loss mean: 164.17141723632812
nll mean: 162.94046020507812 	 kl mean: 1.3488521575927734 	 loss mean: 164.289306640625
nll mean: 162.9557342529297 	 kl mean: 1.3488521575927734 	 loss mean: 164.30459594726562



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.54it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.68it/s][A

nll mean: 162.75827026367188 	 kl mean: 1.3488521575927734 	 loss mean: 164.10711669921875
nll mean: 162.9713897705078 	 kl mean: 1.3488521575927734 	 loss mean: 164.3202362060547
nll mean: 162.86935424804688 	 kl mean: 1.3488521575927734 	 loss mean: 164.21823120117188



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s][A

nll mean: 163.01304626464844 	 kl mean: 1.3488521575927734 	 loss mean: 164.36190795898438
nll mean: 162.8205108642578 	 kl mean: 1.3488521575927734 	 loss mean: 164.16937255859375
nll mean: 163.11151123046875 	 kl mean: 1.3488521575927734 	 loss mean: 164.46035766601562



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.72it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.37it/s][A

nll mean: 163.03016662597656 	 kl mean: 1.3488521575927734 	 loss mean: 164.37901306152344
nll mean: 122.3669204711914 	 kl mean: 1.5867149829864502 	 loss mean: 123.95364379882812
nll mean: 122.16624450683594 	 kl mean: 1.5867149829864502 	 loss mean: 123.7529525756836


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 10.37it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 10.36it/s][A

nll mean: 122.65538787841797 	 kl mean: 1.5867149829864502 	 loss mean: 124.24210357666016
nll mean: 122.31017303466797 	 kl mean: 1.5867149829864502 	 loss mean: 123.89688110351562
nll mean: 122.45468139648438 	 kl mean: 1.5867149829864502 	 loss mean: 124.04139709472656


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 10.36it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.34it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.35it/s][A

nll mean: 122.01984405517578 	 kl mean: 1.5867149829864502 	 loss mean: 123.6065673828125
nll mean: 122.39742279052734 	 kl mean: 1.5867149829864502 	 loss mean: 123.984130859375
nll mean: 122.25042724609375 	 kl mean: 1.5867149829864502 	 loss mean: 123.83714294433594


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.40it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.35it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.32it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]

nll mean: 122.33348083496094 	 kl mean: 1.5867149829864502 	 loss mean: 123.92021179199219
nll mean: 122.37327575683594 	 kl mean: 1.5867149829864502 	 loss mean: 123.95999145507812
nll mean: 112.10669708251953 	 kl mean: 1.0760775804519653 	 loss mean: 113.18277740478516
nll mean: 112.07029724121094 	 kl mean: 1.0760775804519653 	 loss mean: 113.14637756347656
nll mean: 112.01144409179688 	 kl mean: 1.0760775804519653 	 loss mean: 113.0875244140625



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.42it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
 80%|████████  | 8/10 [00:00<00:00, 33.14it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.86it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.096435546875 	 kl mean: 1.0760775804519653 	 loss mean: 113.1725082397461
nll mean: 112.0616226196289 	 kl mean: 1.0760775804519653 	 loss mean: 113.13771057128906
nll mean: 112.1558837890625 	 kl mean: 1.0760775804519653 	 loss mean: 113.23196411132812
nll mean: 112.03955078125 	 kl mean: 1.0760775804519653 	 loss mean: 113.11563110351562
nll mean: 112.02876281738281 	 kl mean: 1.0760775804519653 	 loss mean: 113.10484313964844
nll mean: 112.02410125732422 	 kl mean: 1.0760775804519653 	 loss mean: 113.10017395019531
nll mean: 112.00032043457031 	 kl mean: 1.0760775804519653 	 loss mean: 113.0763931274414



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 14.89it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               

nll mean: 164.8595428466797 	 kl mean: 1.2688090801239014 	 loss mean: 166.12835693359375
nll mean: 164.5574188232422 	 kl mean: 1.2688090801239014 	 loss mean: 165.82623291015625
nll mean: 164.34141540527344 	 kl mean: 1.2688090801239014 	 loss mean: 165.6102294921875



 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.88it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.84it/s][A

nll mean: 164.78421020507812 	 kl mean: 1.2688090801239014 	 loss mean: 166.0530242919922
nll mean: 164.77938842773438 	 kl mean: 1.2688090801239014 	 loss mean: 166.04818725585938
nll mean: 164.7110137939453 	 kl mean: 1.2688090801239014 	 loss mean: 165.97982788085938



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.86it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s][A

nll mean: 164.70736694335938 	 kl mean: 1.2688090801239014 	 loss mean: 165.97618103027344
nll mean: 164.69387817382812 	 kl mean: 1.2688090801239014 	 loss mean: 165.9626922607422
nll mean: 164.39581298828125 	 kl mean: 1.2688090801239014 	 loss mean: 165.6646270751953



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.80it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 22.13it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A

nll mean: 164.6609649658203 	 kl mean: 1.2688090801239014 	 loss mean: 165.92977905273438
nll mean: 125.87158203125 	 kl mean: 1.3181190490722656 	 loss mean: 127.18971252441406
nll mean: 125.96454620361328 	 kl mean: 1.3181190490722656 	 loss mean: 127.28266906738281
nll mean: 125.95870971679688 	 kl mean: 1.3181190490722656 	 loss mean: 127.27682495117188
nll mean: 125.64817810058594 	 kl mean: 1.3181190490722656 	 loss mean: 126.96629333496094



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.79it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.73it/s][A

nll mean: 126.15846252441406 	 kl mean: 1.3181190490722656 	 loss mean: 127.47659301757812
nll mean: 125.94725799560547 	 kl mean: 1.3181190490722656 	 loss mean: 127.26537322998047
nll mean: 125.63729858398438 	 kl mean: 1.3181190490722656 	 loss mean: 126.95541381835938
nll mean: 125.89847564697266 	 kl mean: 1.3181190490722656 	 loss mean: 127.21659851074219
nll mean: 125.65140533447266 	 kl mean: 1.3181190490722656 	 loss mean: 126.96952819824219



                                               
100%|██████████| 10/10 [00:00<00:00, 21.49it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s]
 20%|██        | 2/10 [00:00<00:00, 14.87it/s][A

nll mean: 126.0078125 	 kl mean: 1.3181190490722656 	 loss mean: 127.32593536376953
nll mean: 118.83809661865234 	 kl mean: 1.3022555112838745 	 loss mean: 120.14035034179688
nll mean: 118.63902282714844 	 kl mean: 1.3022555112838745 	 loss mean: 119.94126892089844



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.80it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.67it/s][A

nll mean: 118.5745620727539 	 kl mean: 1.3022555112838745 	 loss mean: 119.87681579589844
nll mean: 118.8505630493164 	 kl mean: 1.3022555112838745 	 loss mean: 120.15281677246094
nll mean: 118.86170959472656 	 kl mean: 1.3022555112838745 	 loss mean: 120.16397094726562



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.81it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.78it/s][A

nll mean: 118.79412078857422 	 kl mean: 1.3022555112838745 	 loss mean: 120.09638214111328
nll mean: 118.81278228759766 	 kl mean: 1.3022555112838745 	 loss mean: 120.11503601074219
nll mean: 118.73431396484375 	 kl mean: 1.3022555112838745 	 loss mean: 120.03656768798828



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.75it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.8116226196289 	 kl mean: 1.3022555112838745 	 loss mean: 120.11387634277344
nll mean: 118.79898071289062 	 kl mean: 1.3022555112838745 	 loss mean: 120.10123443603516
nll mean: 87.774169921875 	 kl mean: 1.3738670349121094 	 loss mean: 89.14804077148438
nll mean: 87.70181274414062 	 kl mean: 1.3738670349121094 	 loss mean: 89.07568359375


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 21.43it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.74it/s][A

nll mean: 87.71139526367188 	 kl mean: 1.3738670349121094 	 loss mean: 89.08526611328125
nll mean: 87.72129821777344 	 kl mean: 1.3738670349121094 	 loss mean: 89.09516906738281
nll mean: 87.55325317382812 	 kl mean: 1.3738670349121094 	 loss mean: 88.9271240234375
nll mean: 87.63926696777344 	 kl mean: 1.3738670349121094 	 loss mean: 89.01313781738281
nll mean: 87.75132751464844 	 kl mean: 1.3738670349121094 	 loss mean: 89.12519836425781


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.74it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
100%|██████████| 10/10 [00:00<00:00, 22.17it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 87.8656234741211 	 kl mean: 1.3738670349121094 	 loss mean: 89.23948669433594
nll mean: 87.88163757324219 	 kl mean: 1.3738670349121094 	 loss mean: 89.25550842285156
nll mean: 87.62384033203125 	 kl mean: 1.3738670349121094 	 loss mean: 88.99771118164062
nll mean: 113.8887939453125 	 kl mean: 1.101811408996582 	 loss mean: 114.9906005859375
nll mean: 113.6124267578125 	 kl mean: 1.101811408996582 	 loss mean: 114.71424865722656


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
 30%|███       | 3/10 [00:00<00:00, 22.27it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.02it/s][A

nll mean: 113.70913696289062 	 kl mean: 1.101811408996582 	 loss mean: 114.81094360351562
nll mean: 113.91757202148438 	 kl mean: 1.101811408996582 	 loss mean: 115.01937866210938
nll mean: 113.78973388671875 	 kl mean: 1.101811408996582 	 loss mean: 114.89155578613281
nll mean: 113.90660858154297 	 kl mean: 1.101811408996582 	 loss mean: 115.0084228515625
nll mean: 113.63633728027344 	 kl mean: 1.101811408996582 	 loss mean: 114.73815155029297


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.02it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.75it/s]
100%|██████████| 10/10 [00:00<00:00, 21.80it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s]

nll mean: 113.96249389648438 	 kl mean: 1.101811408996582 	 loss mean: 115.0643081665039
nll mean: 113.82701110839844 	 kl mean: 1.101811408996582 	 loss mean: 114.92881774902344
nll mean: 113.70958709716797 	 kl mean: 1.101811408996582 	 loss mean: 114.8114013671875
nll mean: 125.70929718017578 	 kl mean: 1.3953264951705933 	 loss mean: 127.10462188720703



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s]
 20%|██        | 2/10 [00:00<00:00, 12.15it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.31it/s][A

nll mean: 126.01464080810547 	 kl mean: 1.3953264951705933 	 loss mean: 127.40997314453125
nll mean: 126.14918518066406 	 kl mean: 1.3953264951705933 	 loss mean: 127.54450988769531
nll mean: 125.82737731933594 	 kl mean: 1.3953264951705933 	 loss mean: 127.22270202636719



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.44it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A

nll mean: 125.84661865234375 	 kl mean: 1.3953264951705933 	 loss mean: 127.24195098876953
nll mean: 125.77326965332031 	 kl mean: 1.3953264951705933 	 loss mean: 127.16858673095703
nll mean: 125.72863006591797 	 kl mean: 1.3953264951705933 	 loss mean: 127.12394714355469



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.86it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.61it/s][A
 76%|███████▋  | 29/38 [00:17<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.63143920898438 	 kl mean: 1.3953264951705933 	 loss mean: 127.02677154541016
nll mean: 125.75462341308594 	 kl mean: 1.3953264951705933 	 loss mean: 127.14994812011719
nll mean: 125.8734130859375 	 kl mean: 1.3953264951705933 	 loss mean: 127.26873779296875



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 20%|██        | 2/10 [00:00<00:00, 10.24it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A

nll mean: 66.35044860839844 	 kl mean: 1.7469960451126099 	 loss mean: 68.09744262695312
nll mean: 66.14906311035156 	 kl mean: 1.7469960451126099 	 loss mean: 67.89605712890625
nll mean: 65.93350219726562 	 kl mean: 1.7469960451126099 	 loss mean: 67.68049621582031



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.22it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.22it/s][A

nll mean: 65.96501159667969 	 kl mean: 1.7469960451126099 	 loss mean: 67.71200561523438
nll mean: 66.01473999023438 	 kl mean: 1.7469960451126099 	 loss mean: 67.76173400878906
nll mean: 66.09790802001953 	 kl mean: 1.7469960451126099 	 loss mean: 67.84490966796875



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.21it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A

nll mean: 66.17416381835938 	 kl mean: 1.7469960451126099 	 loss mean: 67.9211654663086
nll mean: 66.17857360839844 	 kl mean: 1.7469960451126099 	 loss mean: 67.92556762695312
nll mean: 66.31205749511719 	 kl mean: 1.7469960451126099 	 loss mean: 68.0590591430664



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.22it/s][A
 79%|███████▉  | 30/38 [00:18<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 13.28it/s][A

nll mean: 66.17118835449219 	 kl mean: 1.7469960451126099 	 loss mean: 67.9181900024414
nll mean: 109.49833679199219 	 kl mean: 1.6031956672668457 	 loss mean: 111.10153198242188
nll mean: 109.6827163696289 	 kl mean: 1.6031956672668457 	 loss mean: 111.28591918945312



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.03it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A

nll mean: 109.42890167236328 	 kl mean: 1.6031956672668457 	 loss mean: 111.03209686279297
nll mean: 109.76177215576172 	 kl mean: 1.6031956672668457 	 loss mean: 111.3649673461914
nll mean: 109.69134521484375 	 kl mean: 1.6031956672668457 	 loss mean: 111.29454040527344



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.90it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.86it/s][A

nll mean: 109.56573486328125 	 kl mean: 1.6031956672668457 	 loss mean: 111.16893005371094
nll mean: 109.63203430175781 	 kl mean: 1.6031956672668457 	 loss mean: 111.2352294921875
nll mean: 109.44401550292969 	 kl mean: 1.6031956672668457 	 loss mean: 111.04721069335938



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.78it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]

nll mean: 109.54264831542969 	 kl mean: 1.6031956672668457 	 loss mean: 111.14584350585938
nll mean: 109.62996673583984 	 kl mean: 1.6031956672668457 	 loss mean: 111.23316955566406
nll mean: 142.1649627685547 	 kl mean: 1.3799428939819336 	 loss mean: 143.54489135742188



                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 10.24it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.21it/s][A

nll mean: 142.54452514648438 	 kl mean: 1.3799428939819336 	 loss mean: 143.92446899414062
nll mean: 142.46304321289062 	 kl mean: 1.3799428939819336 	 loss mean: 143.84298706054688
nll mean: 142.09278869628906 	 kl mean: 1.3799428939819336 	 loss mean: 143.47271728515625



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.08it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.02it/s][A


nll mean: 142.43417358398438 	 kl mean: 1.3799428939819336 	 loss mean: 143.81411743164062
nll mean: 142.24063110351562 	 kl mean: 1.3799428939819336 	 loss mean: 143.62057495117188


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.98it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.94it/s][A
                                               


nll mean: 142.2015838623047 	 kl mean: 1.3799428939819336 	 loss mean: 143.58152770996094
nll mean: 142.45950317382812 	 kl mean: 1.3799428939819336 	 loss mean: 143.8394317626953
nll mean: 142.2658233642578 	 kl mean: 1.3799428939819336 	 loss mean: 143.64576721191406


 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.35it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.03it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 25.90it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A

nll mean: 142.3148193359375 	 kl mean: 1.3799428939819336 	 loss mean: 143.69476318359375
nll mean: 66.05613708496094 	 kl mean: 1.464903712272644 	 loss mean: 67.52104187011719
nll mean: 66.06599426269531 	 kl mean: 1.464903712272644 	 loss mean: 67.53089904785156
nll mean: 65.8345718383789 	 kl mean: 1.464903712272644 	 loss mean: 67.29947662353516
nll mean: 66.09342193603516 	 kl mean: 1.464903712272644 	 loss mean: 67.5583267211914
nll mean: 66.06206512451172 	 kl mean: 1.464903712272644 	 loss mean: 67.52696990966797



                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.74it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.65it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.56it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 66.13492584228516 	 kl mean: 1.464903712272644 	 loss mean: 67.59982299804688
nll mean: 65.92190551757812 	 kl mean: 1.464903712272644 	 loss mean: 67.38681030273438
nll mean: 66.02030944824219 	 kl mean: 1.464903712272644 	 loss mean: 67.48521423339844
nll mean: 66.02059173583984 	 kl mean: 1.464903712272644 	 loss mean: 67.4854965209961
nll mean: 66.0748291015625 	 kl mean: 1.464903712272644 	 loss mean: 67.53973388671875


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 22.06it/s][A

nll mean: 123.81840515136719 	 kl mean: 1.2299844026565552 	 loss mean: 125.04838562011719
nll mean: 124.19551849365234 	 kl mean: 1.2299844026565552 	 loss mean: 125.42550659179688
nll mean: 124.17385864257812 	 kl mean: 1.2299844026565552 	 loss mean: 125.40383911132812
nll mean: 124.12567138671875 	 kl mean: 1.2299844026565552 	 loss mean: 125.35565185546875
nll mean: 124.10964965820312 	 kl mean: 1.2299844026565552 	 loss mean: 125.33963775634766


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 22.06it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.98it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
100%|██████████| 10/10 [00:00<00:00, 21.88it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.03337860107422 	 kl mean: 1.2299844026565552 	 loss mean: 125.26336669921875
nll mean: 124.27774047851562 	 kl mean: 1.2299844026565552 	 loss mean: 125.50773620605469
nll mean: 124.19943237304688 	 kl mean: 1.2299844026565552 	 loss mean: 125.42941284179688
nll mean: 124.19049072265625 	 kl mean: 1.2299844026565552 	 loss mean: 125.42047119140625
nll mean: 124.16439056396484 	 kl mean: 1.2299844026565552 	 loss mean: 125.39437866210938



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 12.48it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s][A

nll mean: 124.80671691894531 	 kl mean: 1.4231326580047607 	 loss mean: 126.22984313964844
nll mean: 124.90113830566406 	 kl mean: 1.4231326580047607 	 loss mean: 126.32427978515625
nll mean: 124.69047546386719 	 kl mean: 1.4231326580047607 	 loss mean: 126.11360931396484



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.61it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.53it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A

nll mean: 124.80137634277344 	 kl mean: 1.4231326580047607 	 loss mean: 126.2245101928711
nll mean: 124.97831726074219 	 kl mean: 1.4231326580047607 	 loss mean: 126.40144348144531
nll mean: 125.06685638427734 	 kl mean: 1.4231326580047607 	 loss mean: 126.489990234375



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A

nll mean: 124.96854400634766 	 kl mean: 1.4231326580047607 	 loss mean: 126.39168548583984
nll mean: 124.822509765625 	 kl mean: 1.4231326580047607 	 loss mean: 126.24563598632812
nll mean: 124.84407043457031 	 kl mean: 1.4231326580047607 	 loss mean: 126.26719665527344



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.61it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.69it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A

nll mean: 124.7210693359375 	 kl mean: 1.4231326580047607 	 loss mean: 126.14421081542969
nll mean: 118.07073211669922 	 kl mean: 1.4007399082183838 	 loss mean: 119.47146606445312
nll mean: 118.16294860839844 	 kl mean: 1.4007399082183838 	 loss mean: 119.56367492675781


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.71it/s][A

nll mean: 118.23688507080078 	 kl mean: 1.4007399082183838 	 loss mean: 119.63761901855469
nll mean: 117.99176788330078 	 kl mean: 1.4007399082183838 	 loss mean: 119.39250946044922
nll mean: 118.2340087890625 	 kl mean: 1.4007399082183838 	 loss mean: 119.63475036621094


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.71it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.70it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A

nll mean: 118.31993103027344 	 kl mean: 1.4007399082183838 	 loss mean: 119.72067260742188
nll mean: 118.21739196777344 	 kl mean: 1.4007399082183838 	 loss mean: 119.61813354492188
nll mean: 118.09660339355469 	 kl mean: 1.4007399082183838 	 loss mean: 119.49734497070312


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]

nll mean: 117.8785400390625 	 kl mean: 1.4007399082183838 	 loss mean: 119.27928161621094
nll mean: 118.27267456054688 	 kl mean: 1.4007399082183838 	 loss mean: 119.67342376708984
nll mean: 117.01862335205078 	 kl mean: 1.3737821578979492 	 loss mean: 118.39241027832031
nll mean: 117.26020812988281 	 kl mean: 1.3737821578979492 	 loss mean: 118.63398742675781



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 21.36it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.44it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A

nll mean: 117.2030258178711 	 kl mean: 1.3737821578979492 	 loss mean: 118.5768051147461
nll mean: 117.21976470947266 	 kl mean: 1.3737821578979492 	 loss mean: 118.59354400634766
nll mean: 117.22893524169922 	 kl mean: 1.3737821578979492 	 loss mean: 118.60272216796875
nll mean: 117.10328674316406 	 kl mean: 1.3737821578979492 	 loss mean: 118.47706604003906
nll mean: 117.34941101074219 	 kl mean: 1.3737821578979492 	 loss mean: 118.72319030761719



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.40it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.46it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 29.19it/s][A

nll mean: 117.33506774902344 	 kl mean: 1.3737821578979492 	 loss mean: 118.70884704589844
nll mean: 117.28362274169922 	 kl mean: 1.3737821578979492 	 loss mean: 118.65740203857422
nll mean: 117.33699798583984 	 kl mean: 1.3737821578979492 	 loss mean: 118.71078491210938
nll mean: 89.55122375488281 	 kl mean: 1.8622530698776245 	 loss mean: 91.4134750366211
nll mean: 89.28904724121094 	 kl mean: 1.8622530698776245 	 loss mean: 91.15129852294922
nll mean: 89.05168151855469 	 kl mean: 1.8622530698776245 	 loss mean: 90.91392517089844


                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:23<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 29.19it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 29.04it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 29.01it/s][A

nll mean: 89.10653686523438 	 kl mean: 1.8622530698776245 	 loss mean: 90.96879577636719
nll mean: 89.0975341796875 	 kl mean: 1.8622530698776245 	 loss mean: 90.95979309082031
nll mean: 88.64952850341797 	 kl mean: 1.8622530698776245 	 loss mean: 90.51177978515625
nll mean: 89.28926849365234 	 kl mean: 1.8622530698776245 	 loss mean: 91.15151977539062
nll mean: 89.1715087890625 	 kl mean: 1.8622530698776245 	 loss mean: 91.03376770019531
nll mean: 89.46526336669922 	 kl mean: 1.8622530698776245 	 loss mean: 91.3275146484375


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 28.84it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 89.32158660888672 	 kl mean: 1.8622530698776245 	 loss mean: 91.183837890625
Approximate NLL:
tensor(126.4909, device='cuda:0')
Approximate KL:
tensor(1.4329, device='cuda:0')
Testing took 0:00:25.131638


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .85it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .85it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.85it/s][A

nll mean: 115.12419128417969 	 kl mean: 1.020707368850708 	 loss mean: 116.14490509033203
nll mean: 114.99970245361328 	 kl mean: 1.020707368850708 	 loss mean: 116.02041625976562
nll mean: 115.20944213867188 	 kl mean: 1.020707368850708 	 loss mean: 116.23014068603516
nll mean: 115.22512817382812 	 kl mean: 1.020707368850708 	 loss mean: 116.24584197998047
nll mean: 115.22010803222656 	 kl mean: 1.020707368850708 	 loss mean: 116.24081420898438


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.85it/s][A
                                      .52it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .52it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .52it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.52it/s][A
                                      .29it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.05it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 115.04019165039062 	 kl mean: 1.020707368850708 	 loss mean: 116.06090545654297
nll mean: 115.1710433959961 	 kl mean: 1.020707368850708 	 loss mean: 116.19175720214844
nll mean: 115.29483032226562 	 kl mean: 1.020707368850708 	 loss mean: 116.31554412841797
nll mean: 114.96208953857422 	 kl mean: 1.020707368850708 	 loss mean: 115.98280334472656
nll mean: 115.18794250488281 	 kl mean: 1.020707368850708 	 loss mean: 116.20864868164062


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 20%|██        | 2/10 [00:00<00:00, 14.36it/s][A

nll mean: 130.73696899414062 	 kl mean: 1.2991843223571777 	 loss mean: 132.03616333007812
nll mean: 130.9482421875 	 kl mean: 1.2991843223571777 	 loss mean: 132.24740600585938
nll mean: 130.89517211914062 	 kl mean: 1.2991843223571777 	 loss mean: 132.19436645507812


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 20%|██        | 2/10 [00:00<00:00, 14.36it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 40%|████      | 4/10 [00:00<00:00, 14.36it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.28it/s][A

nll mean: 131.02615356445312 	 kl mean: 1.2991843223571777 	 loss mean: 132.32533264160156
nll mean: 130.74444580078125 	 kl mean: 1.2991843223571777 	 loss mean: 132.04364013671875
nll mean: 130.94869995117188 	 kl mean: 1.2991843223571777 	 loss mean: 132.2478790283203


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.28it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.28it/s][A

nll mean: 130.97023010253906 	 kl mean: 1.2991843223571777 	 loss mean: 132.2694091796875
nll mean: 131.1636962890625 	 kl mean: 1.2991843223571777 	 loss mean: 132.462890625
nll mean: 130.76611328125 	 kl mean: 1.2991843223571777 	 loss mean: 132.0653076171875


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.28it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.27it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 25.58it/s][A

nll mean: 130.91529846191406 	 kl mean: 1.2991843223571777 	 loss mean: 132.21449279785156
nll mean: 103.16380310058594 	 kl mean: 1.0679515600204468 	 loss mean: 104.23175048828125
nll mean: 103.44956970214844 	 kl mean: 1.0679515600204468 	 loss mean: 104.51752471923828
nll mean: 103.20458984375 	 kl mean: 1.0679515600204468 	 loss mean: 104.27254486083984
nll mean: 103.32331848144531 	 kl mean: 1.0679515600204468 	 loss mean: 104.39126586914062


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 25.58it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.30it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.05it/s][A

nll mean: 103.12065124511719 	 kl mean: 1.0679515600204468 	 loss mean: 104.18860626220703
nll mean: 103.19124603271484 	 kl mean: 1.0679515600204468 	 loss mean: 104.25920104980469
nll mean: 103.06297302246094 	 kl mean: 1.0679515600204468 	 loss mean: 104.13092041015625
nll mean: 103.06352996826172 	 kl mean: 1.0679515600204468 	 loss mean: 104.13148498535156
nll mean: 103.22209167480469 	 kl mean: 1.0679515600204468 	 loss mean: 104.29004669189453


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
100%|██████████| 10/10 [00:00<00:00, 24.85it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A

nll mean: 103.21607208251953 	 kl mean: 1.0679515600204468 	 loss mean: 104.28402709960938
nll mean: 143.9958953857422 	 kl mean: 1.2071609497070312 	 loss mean: 145.20306396484375
nll mean: 143.9319305419922 	 kl mean: 1.2071609497070312 	 loss mean: 145.13909912109375


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.15it/s]
 40%|████      | 4/10 [00:00<00:00, 10.89it/s][A

nll mean: 144.02334594726562 	 kl mean: 1.2071609497070312 	 loss mean: 145.23049926757812
nll mean: 143.97276306152344 	 kl mean: 1.2071609497070312 	 loss mean: 145.179931640625
nll mean: 143.8599853515625 	 kl mean: 1.2071609497070312 	 loss mean: 145.06715393066406


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 40%|████      | 4/10 [00:00<00:00, 10.89it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.92it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.91it/s][A

nll mean: 144.16586303710938 	 kl mean: 1.2071609497070312 	 loss mean: 145.37303161621094
nll mean: 143.99679565429688 	 kl mean: 1.2071609497070312 	 loss mean: 145.20396423339844
nll mean: 144.04502868652344 	 kl mean: 1.2071609497070312 	 loss mean: 145.25218200683594


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.15it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.91it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.90it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.02040100097656 	 kl mean: 1.2071609497070312 	 loss mean: 145.22756958007812
nll mean: 143.86705017089844 	 kl mean: 1.2071609497070312 	 loss mean: 145.07421875
nll mean: 132.0697784423828 	 kl mean: 1.1326091289520264 	 loss mean: 133.202392578125


                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 13.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.86it/s][A

nll mean: 131.92141723632812 	 kl mean: 1.1326091289520264 	 loss mean: 133.05401611328125
nll mean: 131.92869567871094 	 kl mean: 1.1326091289520264 	 loss mean: 133.06130981445312
nll mean: 131.69241333007812 	 kl mean: 1.1326091289520264 	 loss mean: 132.8250274658203


                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 13.86it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.96it/s][A

nll mean: 132.21351623535156 	 kl mean: 1.1326091289520264 	 loss mean: 133.34613037109375
nll mean: 132.0070343017578 	 kl mean: 1.1326091289520264 	 loss mean: 133.1396484375
nll mean: 132.00596618652344 	 kl mean: 1.1326091289520264 	 loss mean: 133.1385498046875


                                              
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.96it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.93it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.91it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 131.92153930664062 	 kl mean: 1.1326091289520264 	 loss mean: 133.05413818359375
nll mean: 132.08831787109375 	 kl mean: 1.1326091289520264 	 loss mean: 133.22093200683594
nll mean: 132.07786560058594 	 kl mean: 1.1326091289520264 	 loss mean: 133.21047973632812


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.84it/s][A

nll mean: 129.7901611328125 	 kl mean: 1.0638043880462646 	 loss mean: 130.85397338867188
nll mean: 129.47897338867188 	 kl mean: 1.0638043880462646 	 loss mean: 130.54278564453125
nll mean: 129.39508056640625 	 kl mean: 1.0638043880462646 	 loss mean: 130.45887756347656


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.84it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 14.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.44it/s][A

nll mean: 129.5034942626953 	 kl mean: 1.0638043880462646 	 loss mean: 130.5673065185547
nll mean: 129.585205078125 	 kl mean: 1.0638043880462646 	 loss mean: 130.6490020751953
nll mean: 129.49002075195312 	 kl mean: 1.0638043880462646 	 loss mean: 130.5538330078125


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.44it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.27it/s][A

nll mean: 129.49411010742188 	 kl mean: 1.0638043880462646 	 loss mean: 130.5579071044922
nll mean: 129.40731811523438 	 kl mean: 1.0638043880462646 	 loss mean: 130.47109985351562
nll mean: 129.67822265625 	 kl mean: 1.0638043880462646 	 loss mean: 130.74203491210938


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.27it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.15it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 24.99it/s][A

nll mean: 129.51171875 	 kl mean: 1.0638043880462646 	 loss mean: 130.57553100585938
nll mean: 139.960693359375 	 kl mean: 0.9691920280456543 	 loss mean: 140.9298858642578
nll mean: 140.17840576171875 	 kl mean: 0.9691920280456543 	 loss mean: 141.14759826660156
nll mean: 140.04275512695312 	 kl mean: 0.9691920280456543 	 loss mean: 141.01194763183594
nll mean: 140.1088104248047 	 kl mean: 0.9691920280456543 	 loss mean: 141.07798767089844


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 24.99it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.80it/s][A

nll mean: 139.79214477539062 	 kl mean: 0.9691920280456543 	 loss mean: 140.76133728027344
nll mean: 139.77146911621094 	 kl mean: 0.9691920280456543 	 loss mean: 140.74066162109375
nll mean: 139.85403442382812 	 kl mean: 0.9691920280456543 	 loss mean: 140.82322692871094
nll mean: 139.8268280029297 	 kl mean: 0.9691920280456543 	 loss mean: 140.7960205078125
nll mean: 139.9037628173828 	 kl mean: 0.9691920280456543 	 loss mean: 140.87295532226562


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 24.68it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.26it/s][A

nll mean: 140.134033203125 	 kl mean: 0.9691920280456543 	 loss mean: 141.10324096679688
nll mean: 111.4317626953125 	 kl mean: 1.2008655071258545 	 loss mean: 112.63263702392578
nll mean: 111.34956359863281 	 kl mean: 1.2008655071258545 	 loss mean: 112.55043029785156
nll mean: 111.4403076171875 	 kl mean: 1.2008655071258545 	 loss mean: 112.64117431640625
nll mean: 111.19339752197266 	 kl mean: 1.2008655071258545 	 loss mean: 112.39427185058594


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.26it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.13it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.02it/s][A

nll mean: 111.14527893066406 	 kl mean: 1.2008655071258545 	 loss mean: 112.34614562988281
nll mean: 110.87857818603516 	 kl mean: 1.2008655071258545 	 loss mean: 112.07943725585938
nll mean: 111.42018127441406 	 kl mean: 1.2008655071258545 	 loss mean: 112.62104797363281
nll mean: 111.31332397460938 	 kl mean: 1.2008655071258545 	 loss mean: 112.51419067382812
nll mean: 111.22840881347656 	 kl mean: 1.2008655071258545 	 loss mean: 112.42927551269531


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
100%|██████████| 10/10 [00:00<00:00, 24.83it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.56it/s][A

nll mean: 111.2826156616211 	 kl mean: 1.2008655071258545 	 loss mean: 112.48348236083984
nll mean: 136.05372619628906 	 kl mean: 1.1902151107788086 	 loss mean: 137.2439422607422
nll mean: 136.2705078125 	 kl mean: 1.1902151107788086 	 loss mean: 137.46072387695312


                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
 20%|██        | 2/10 [00:00<00:00, 14.56it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 40%|████      | 4/10 [00:00<00:00, 14.51it/s][A

nll mean: 136.26429748535156 	 kl mean: 1.1902151107788086 	 loss mean: 137.45452880859375
nll mean: 136.1395263671875 	 kl mean: 1.1902151107788086 	 loss mean: 137.32974243164062
nll mean: 136.101806640625 	 kl mean: 1.1902151107788086 	 loss mean: 137.29202270507812
nll mean: 136.33670043945312 	 kl mean: 1.1902151107788086 	 loss mean: 137.52691650390625



                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.88it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]

nll mean: 136.38279724121094 	 kl mean: 1.1902151107788086 	 loss mean: 137.57301330566406
nll mean: 136.30392456054688 	 kl mean: 1.1902151107788086 	 loss mean: 137.494140625
nll mean: 136.20709228515625 	 kl mean: 1.1902151107788086 	 loss mean: 137.39730834960938
nll mean: 136.29676818847656 	 kl mean: 1.1902151107788086 	 loss mean: 137.48699951171875



 80%|████████  | 8/10 [00:00<00:00, 14.79it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.75it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A

nll mean: 136.72679138183594 	 kl mean: 0.9699894785881042 	 loss mean: 137.69677734375
nll mean: 136.57974243164062 	 kl mean: 0.9699894785881042 	 loss mean: 137.54974365234375
nll mean: 136.4919891357422 	 kl mean: 0.9699894785881042 	 loss mean: 137.46197509765625
nll mean: 136.5079345703125 	 kl mean: 0.9699894785881042 	 loss mean: 137.47793579101562
nll mean: 136.63497924804688 	 kl mean: 0.9699894785881042 	 loss mean: 137.60496520996094


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.45it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.33it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.51608276367188 	 kl mean: 0.9699894785881042 	 loss mean: 137.486083984375
nll mean: 136.5166778564453 	 kl mean: 0.9699894785881042 	 loss mean: 137.48667907714844
nll mean: 136.4569091796875 	 kl mean: 0.9699894785881042 	 loss mean: 137.42689514160156
nll mean: 136.66229248046875 	 kl mean: 0.9699894785881042 	 loss mean: 137.63229370117188
nll mean: 136.6012420654297 	 kl mean: 0.9699894785881042 	 loss mean: 137.57122802734375


                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A

nll mean: 125.13330078125 	 kl mean: 1.2297024726867676 	 loss mean: 126.36300659179688
nll mean: 125.30501556396484 	 kl mean: 1.2297024726867676 	 loss mean: 126.53472137451172
nll mean: 125.344970703125 	 kl mean: 1.2297024726867676 	 loss mean: 126.57467651367188
nll mean: 125.16290283203125 	 kl mean: 1.2297024726867676 	 loss mean: 126.3926010131836
nll mean: 125.10436248779297 	 kl mean: 1.2297024726867676 	 loss mean: 126.33406066894531


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.78it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
100%|██████████| 10/10 [00:00<00:00, 24.74it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.10231018066406 	 kl mean: 1.2297024726867676 	 loss mean: 126.3320083618164
nll mean: 125.12195587158203 	 kl mean: 1.2297024726867676 	 loss mean: 126.35166931152344
nll mean: 125.07616424560547 	 kl mean: 1.2297024726867676 	 loss mean: 126.30586242675781
nll mean: 125.12564849853516 	 kl mean: 1.2297024726867676 	 loss mean: 126.3553466796875
nll mean: 124.89349365234375 	 kl mean: 1.2297024726867676 	 loss mean: 126.12319946289062


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.66it/s][A

nll mean: 147.71829223632812 	 kl mean: 1.173799991607666 	 loss mean: 148.89208984375
nll mean: 147.7684783935547 	 kl mean: 1.173799991607666 	 loss mean: 148.94229125976562
nll mean: 147.6708984375 	 kl mean: 1.173799991607666 	 loss mean: 148.84471130371094
nll mean: 147.4422149658203 	 kl mean: 1.173799991607666 	 loss mean: 148.6160125732422
nll mean: 147.66659545898438 	 kl mean: 1.173799991607666 	 loss mean: 148.8404083251953


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.66it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.39it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
100%|██████████| 10/10 [00:00<00:00, 21.27it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 147.23292541503906 	 kl mean: 1.173799991607666 	 loss mean: 148.40672302246094
nll mean: 147.75592041015625 	 kl mean: 1.173799991607666 	 loss mean: 148.92971801757812
nll mean: 147.37176513671875 	 kl mean: 1.173799991607666 	 loss mean: 148.54556274414062
nll mean: 147.41586303710938 	 kl mean: 1.173799991607666 	 loss mean: 148.58966064453125
nll mean: 147.59893798828125 	 kl mean: 1.173799991607666 	 loss mean: 148.7727508544922


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
 20%|██        | 2/10 [00:00<00:00, 12.84it/s][A

nll mean: 124.62911224365234 	 kl mean: 1.4119101762771606 	 loss mean: 126.04102325439453
nll mean: 124.74150085449219 	 kl mean: 1.4119101762771606 	 loss mean: 126.15341186523438
nll mean: 124.44856262207031 	 kl mean: 1.4119101762771606 	 loss mean: 125.8604736328125


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 20%|██        | 2/10 [00:00<00:00, 12.84it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 40%|████      | 4/10 [00:00<00:00, 12.77it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A

nll mean: 124.44384765625 	 kl mean: 1.4119101762771606 	 loss mean: 125.85576629638672
nll mean: 124.4238510131836 	 kl mean: 1.4119101762771606 	 loss mean: 125.83575439453125
nll mean: 124.33111572265625 	 kl mean: 1.4119101762771606 	 loss mean: 125.74302673339844


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A

nll mean: 124.48110961914062 	 kl mean: 1.4119101762771606 	 loss mean: 125.89302062988281
nll mean: 124.49761199951172 	 kl mean: 1.4119101762771606 	 loss mean: 125.90951538085938
nll mean: 124.52095031738281 	 kl mean: 1.4119101762771606 	 loss mean: 125.932861328125


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.62it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.64102172851562 	 kl mean: 1.4119101762771606 	 loss mean: 126.05293273925781
nll mean: 168.90670776367188 	 kl mean: 1.2732301950454712 	 loss mean: 170.17994689941406
nll mean: 168.75619506835938 	 kl mean: 1.2732301950454712 	 loss mean: 170.0294189453125



                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 10.18it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 10.13it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.13it/s][A

nll mean: 168.83290100097656 	 kl mean: 1.2732301950454712 	 loss mean: 170.1061248779297
nll mean: 168.65390014648438 	 kl mean: 1.2732301950454712 	 loss mean: 169.9271240234375
nll mean: 168.77767944335938 	 kl mean: 1.2732301950454712 	 loss mean: 170.05091857910156


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.13it/s][A
                                               [A
                                              

nll mean: 168.77694702148438 	 kl mean: 1.2732301950454712 	 loss mean: 170.0501708984375
nll mean: 168.72705078125 	 kl mean: 1.2732301950454712 	 loss mean: 170.00027465820312


 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.11it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.06it/s][A
                                               [A

nll mean: 168.80429077148438 	 kl mean: 1.2732301950454712 	 loss mean: 170.07752990722656
nll mean: 168.77264404296875 	 kl mean: 1.2732301950454712 	 loss mean: 170.04586791992188



 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 90%|█████████ | 9/10 [00:00<00:00, 10.00it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.04it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 17.93it/s][A

nll mean: 168.72659301757812 	 kl mean: 1.2732301950454712 	 loss mean: 169.99981689453125
nll mean: 141.56292724609375 	 kl mean: 1.1138782501220703 	 loss mean: 142.6768035888672
nll mean: 141.25942993164062 	 kl mean: 1.1138782501220703 	 loss mean: 142.37332153320312
nll mean: 141.21499633789062 	 kl mean: 1.1138782501220703 	 loss mean: 142.32887268066406


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 17.93it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 40%|████      | 4/10 [00:00<00:00, 17.84it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.90it/s][A

nll mean: 141.25848388671875 	 kl mean: 1.1138782501220703 	 loss mean: 142.37234497070312
nll mean: 141.2645263671875 	 kl mean: 1.1138782501220703 	 loss mean: 142.37841796875
nll mean: 141.2864990234375 	 kl mean: 1.1138782501220703 	 loss mean: 142.40037536621094
nll mean: 141.21612548828125 	 kl mean: 1.1138782501220703 	 loss mean: 142.33001708984375


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.90it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:16,  1.41it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.91it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.90it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 141.42269897460938 	 kl mean: 1.1138782501220703 	 loss mean: 142.5365753173828
nll mean: 141.40252685546875 	 kl mean: 1.1138782501220703 	 loss mean: 142.51641845703125
nll mean: 141.28463745117188 	 kl mean: 1.1138782501220703 	 loss mean: 142.39852905273438


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A

nll mean: 149.65748596191406 	 kl mean: 1.3557846546173096 	 loss mean: 151.0132598876953
nll mean: 149.60812377929688 	 kl mean: 1.3557846546173096 	 loss mean: 150.96392822265625
nll mean: 149.64425659179688 	 kl mean: 1.3557846546173096 	 loss mean: 151.0000457763672


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 40%|████      | 4/10 [00:00<00:00, 10.81it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A

nll mean: 149.4610595703125 	 kl mean: 1.3557846546173096 	 loss mean: 150.8168487548828
nll mean: 149.86669921875 	 kl mean: 1.3557846546173096 	 loss mean: 151.22250366210938
nll mean: 149.6649627685547 	 kl mean: 1.3557846546173096 	 loss mean: 151.020751953125


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A

nll mean: 149.44003295898438 	 kl mean: 1.3557846546173096 	 loss mean: 150.79580688476562
nll mean: 149.31971740722656 	 kl mean: 1.3557846546173096 	 loss mean: 150.67550659179688
nll mean: 149.62094116210938 	 kl mean: 1.3557846546173096 	 loss mean: 150.97671508789062


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.77it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.52it/s][A

nll mean: 149.73284912109375 	 kl mean: 1.3557846546173096 	 loss mean: 151.088623046875
nll mean: 150.70285034179688 	 kl mean: 1.0873464345932007 	 loss mean: 151.7902069091797
nll mean: 150.8646697998047 	 kl mean: 1.0873464345932007 	 loss mean: 151.9520263671875
nll mean: 151.0106201171875 	 kl mean: 1.0873464345932007 	 loss mean: 152.09796142578125
nll mean: 150.99606323242188 	 kl mean: 1.0873464345932007 	 loss mean: 152.0834197998047


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.52it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.42it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.27it/s][A

nll mean: 151.02346801757812 	 kl mean: 1.0873464345932007 	 loss mean: 152.11080932617188
nll mean: 151.20046997070312 	 kl mean: 1.0873464345932007 	 loss mean: 152.28781127929688
nll mean: 150.81582641601562 	 kl mean: 1.0873464345932007 	 loss mean: 151.90318298339844
nll mean: 151.16714477539062 	 kl mean: 1.0873464345932007 	 loss mean: 152.25448608398438
nll mean: 150.88174438476562 	 kl mean: 1.0873464345932007 	 loss mean: 151.96908569335938


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
100%|██████████| 10/10 [00:00<00:00, 24.20it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]

nll mean: 150.91146850585938 	 kl mean: 1.0873464345932007 	 loss mean: 151.99880981445312
nll mean: 138.79086303710938 	 kl mean: 1.1299684047698975 	 loss mean: 139.92080688476562
nll mean: 138.89889526367188 	 kl mean: 1.1299684047698975 	 loss mean: 140.02883911132812
nll mean: 138.9122314453125 	 kl mean: 1.1299684047698975 	 loss mean: 140.04220581054688
nll mean: 139.09783935546875 	 kl mean: 1.1299684047698975 	 loss mean: 140.22781372070312
nll mean: 138.92034912109375 	 kl mean: 1.1299684047698975 	 loss mean: 140.05032348632812



                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.58it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.40it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 25.10it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.1482391357422 	 kl mean: 1.1299684047698975 	 loss mean: 140.2781982421875
nll mean: 138.93617248535156 	 kl mean: 1.1299684047698975 	 loss mean: 140.06614685058594
nll mean: 138.85733032226562 	 kl mean: 1.1299684047698975 	 loss mean: 139.9873046875
nll mean: 138.82333374023438 	 kl mean: 1.1299684047698975 	 loss mean: 139.95330810546875
nll mean: 138.86231994628906 	 kl mean: 1.1299684047698975 	 loss mean: 139.99227905273438


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.55it/s][A

nll mean: 135.9083251953125 	 kl mean: 1.1294894218444824 	 loss mean: 137.03781127929688
nll mean: 135.95791625976562 	 kl mean: 1.1294894218444824 	 loss mean: 137.08743286132812
nll mean: 135.99330139160156 	 kl mean: 1.1294894218444824 	 loss mean: 137.122802734375


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.55it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 40%|████      | 4/10 [00:00<00:00, 12.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.69it/s][A

nll mean: 136.0216522216797 	 kl mean: 1.1294894218444824 	 loss mean: 137.15115356445312
nll mean: 135.98812866210938 	 kl mean: 1.1294894218444824 	 loss mean: 137.1175994873047
nll mean: 136.24407958984375 	 kl mean: 1.1294894218444824 	 loss mean: 137.37356567382812


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.69it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.73it/s][A

nll mean: 135.84036254882812 	 kl mean: 1.1294894218444824 	 loss mean: 136.9698486328125
nll mean: 135.89663696289062 	 kl mean: 1.1294894218444824 	 loss mean: 137.02613830566406
nll mean: 136.07107543945312 	 kl mean: 1.1294894218444824 	 loss mean: 137.2005615234375


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.67it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.64it/s][A

nll mean: 135.96038818359375 	 kl mean: 1.1294894218444824 	 loss mean: 137.08987426757812
nll mean: 153.6085205078125 	 kl mean: 1.0493947267532349 	 loss mean: 154.65792846679688
nll mean: 153.59112548828125 	 kl mean: 1.0493947267532349 	 loss mean: 154.64053344726562


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.64it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A

nll mean: 153.63687133789062 	 kl mean: 1.0493947267532349 	 loss mean: 154.686279296875
nll mean: 153.757080078125 	 kl mean: 1.0493947267532349 	 loss mean: 154.80648803710938
nll mean: 153.490966796875 	 kl mean: 1.0493947267532349 	 loss mean: 154.5403594970703


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A

nll mean: 153.80227661132812 	 kl mean: 1.0493947267532349 	 loss mean: 154.8516845703125
nll mean: 153.53146362304688 	 kl mean: 1.0493947267532349 	 loss mean: 154.58084106445312
nll mean: 153.89227294921875 	 kl mean: 1.0493947267532349 	 loss mean: 154.941650390625


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.72it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 153.5413818359375 	 kl mean: 1.0493947267532349 	 loss mean: 154.5907745361328
nll mean: 153.7935028076172 	 kl mean: 1.0493947267532349 	 loss mean: 154.8428955078125
nll mean: 162.94920349121094 	 kl mean: 1.1052253246307373 	 loss mean: 164.054443359375


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A

nll mean: 162.89535522460938 	 kl mean: 1.1052253246307373 	 loss mean: 164.00057983398438
nll mean: 162.92755126953125 	 kl mean: 1.1052253246307373 	 loss mean: 164.03277587890625
nll mean: 162.67529296875 	 kl mean: 1.1052253246307373 	 loss mean: 163.780517578125


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.48it/s][A

nll mean: 162.99668884277344 	 kl mean: 1.1052253246307373 	 loss mean: 164.10191345214844
nll mean: 162.80648803710938 	 kl mean: 1.1052253246307373 	 loss mean: 163.91171264648438
nll mean: 162.8946533203125 	 kl mean: 1.1052253246307373 	 loss mean: 163.9998779296875


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.48it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.61it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 162.87344360351562 	 kl mean: 1.1052253246307373 	 loss mean: 163.97866821289062
nll mean: 162.95977783203125 	 kl mean: 1.1052253246307373 	 loss mean: 164.06500244140625
nll mean: 162.86541748046875 	 kl mean: 1.1052253246307373 	 loss mean: 163.97064208984375


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.44it/s][A

nll mean: 123.87293243408203 	 kl mean: 1.176811933517456 	 loss mean: 125.04974365234375
nll mean: 123.96236419677734 	 kl mean: 1.176811933517456 	 loss mean: 125.13917541503906
nll mean: 124.07158660888672 	 kl mean: 1.176811933517456 	 loss mean: 125.24840545654297


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.44it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 10.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.44it/s][A

nll mean: 123.94136810302734 	 kl mean: 1.176811933517456 	 loss mean: 125.11817932128906
nll mean: 123.86205291748047 	 kl mean: 1.176811933517456 	 loss mean: 125.03886413574219
nll mean: 124.05335998535156 	 kl mean: 1.176811933517456 	 loss mean: 125.23017120361328


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.44it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.41it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.27it/s][A

nll mean: 123.99853515625 	 kl mean: 1.176811933517456 	 loss mean: 125.17533111572266
nll mean: 124.12940979003906 	 kl mean: 1.176811933517456 	 loss mean: 125.30622863769531
nll mean: 124.08152770996094 	 kl mean: 1.176811933517456 	 loss mean: 125.25833892822266


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
100%|██████████| 10/10 [00:00<00:00, 10.34it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.36it/s][A

nll mean: 124.33385467529297 	 kl mean: 1.176811933517456 	 loss mean: 125.51065826416016
nll mean: 111.8647689819336 	 kl mean: 0.8192873001098633 	 loss mean: 112.68405151367188
nll mean: 112.06072998046875 	 kl mean: 0.8192873001098633 	 loss mean: 112.8800048828125
nll mean: 111.94619750976562 	 kl mean: 0.8192873001098633 	 loss mean: 112.76548767089844
nll mean: 111.95903015136719 	 kl mean: 0.8192873001098633 	 loss mean: 112.7783203125
nll mean: 111.99114227294922 	 kl mean: 0.8192873001098633 	 loss mean: 112.8104248046875
nll mean: 111.98063659667969 	 kl mean: 0.8192873001098633 	 loss mean: 112.7999267578125


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.36it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
100%|██████████| 10/10 [00:00<00:00, 32.85it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.89685821533203 	 kl mean: 0.8192873001098633 	 loss mean: 112.71614074707031
nll mean: 111.8955078125 	 kl mean: 0.8192873001098633 	 loss mean: 112.71479797363281
nll mean: 111.90217590332031 	 kl mean: 0.8192873001098633 	 loss mean: 112.7214584350586
nll mean: 112.02947235107422 	 kl mean: 0.8192873001098633 	 loss mean: 112.84876251220703
nll mean: 165.0636749267578 	 kl mean: 1.0016179084777832 	 loss mean: 166.0653076171875


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 14.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.57it/s][A

nll mean: 164.96499633789062 	 kl mean: 1.0016179084777832 	 loss mean: 165.96661376953125
nll mean: 164.93069458007812 	 kl mean: 1.0016179084777832 	 loss mean: 165.93231201171875
nll mean: 165.00296020507812 	 kl mean: 1.0016179084777832 	 loss mean: 166.00457763671875


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 14.57it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.60it/s][A

nll mean: 164.73208618164062 	 kl mean: 1.0016179084777832 	 loss mean: 165.73370361328125
nll mean: 165.104736328125 	 kl mean: 1.0016179084777832 	 loss mean: 166.10635375976562
nll mean: 164.73046875 	 kl mean: 1.0016179084777832 	 loss mean: 165.73208618164062


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.60it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.67it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 164.87493896484375 	 kl mean: 1.0016179084777832 	 loss mean: 165.87655639648438
nll mean: 164.93310546875 	 kl mean: 1.0016179084777832 	 loss mean: 165.93472290039062
nll mean: 164.85174560546875 	 kl mean: 1.0016179084777832 	 loss mean: 165.8533477783203
nll mean: 126.25122833251953 	 kl mean: 1.0772547721862793 	 loss mean: 127.3284912109375


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 22.18it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.87it/s][A

nll mean: 126.16830444335938 	 kl mean: 1.0772547721862793 	 loss mean: 127.24555969238281
nll mean: 126.37947082519531 	 kl mean: 1.0772547721862793 	 loss mean: 127.45671844482422
nll mean: 126.35318756103516 	 kl mean: 1.0772547721862793 	 loss mean: 127.43045043945312
nll mean: 126.26171875 	 kl mean: 1.0772547721862793 	 loss mean: 127.3389663696289
nll mean: 126.46847534179688 	 kl mean: 1.0772547721862793 	 loss mean: 127.54573822021484


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.87it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 21.33it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.48159790039062 	 kl mean: 1.0772547721862793 	 loss mean: 127.55885314941406
nll mean: 126.12013244628906 	 kl mean: 1.0772547721862793 	 loss mean: 127.19739532470703
nll mean: 126.26136016845703 	 kl mean: 1.0772547721862793 	 loss mean: 127.338623046875
nll mean: 126.05534362792969 	 kl mean: 1.0772547721862793 	 loss mean: 127.13259887695312


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.39it/s][A

nll mean: 120.50907897949219 	 kl mean: 1.0929386615753174 	 loss mean: 121.60202026367188
nll mean: 120.39273834228516 	 kl mean: 1.0929386615753174 	 loss mean: 121.48567199707031
nll mean: 120.79468536376953 	 kl mean: 1.0929386615753174 	 loss mean: 121.88761901855469


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.39it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.50it/s][A

nll mean: 120.65675354003906 	 kl mean: 1.0929386615753174 	 loss mean: 121.74968719482422
nll mean: 120.746826171875 	 kl mean: 1.0929386615753174 	 loss mean: 121.83976745605469
nll mean: 120.6874008178711 	 kl mean: 1.0929386615753174 	 loss mean: 121.78033447265625


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.50it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.51it/s][A

nll mean: 120.73160552978516 	 kl mean: 1.0929386615753174 	 loss mean: 121.82454681396484
nll mean: 120.56204986572266 	 kl mean: 1.0929386615753174 	 loss mean: 121.65498352050781
nll mean: 120.58340454101562 	 kl mean: 1.0929386615753174 	 loss mean: 121.67635345458984


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.55it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 23.23it/s][A

nll mean: 120.45435333251953 	 kl mean: 1.0929386615753174 	 loss mean: 121.54729461669922
nll mean: 87.35821533203125 	 kl mean: 1.2305424213409424 	 loss mean: 88.58876037597656
nll mean: 87.20953369140625 	 kl mean: 1.2305424213409424 	 loss mean: 88.44007110595703
nll mean: 87.27536010742188 	 kl mean: 1.2305424213409424 	 loss mean: 88.50590515136719
nll mean: 87.26011657714844 	 kl mean: 1.2305424213409424 	 loss mean: 88.49065399169922


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 23.23it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.63it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.65it/s][A

nll mean: 87.29981994628906 	 kl mean: 1.2305424213409424 	 loss mean: 88.53036499023438
nll mean: 87.29220581054688 	 kl mean: 1.2305424213409424 	 loss mean: 88.52274322509766
nll mean: 87.1821060180664 	 kl mean: 1.2305424213409424 	 loss mean: 88.41264343261719
nll mean: 87.33970642089844 	 kl mean: 1.2305424213409424 	 loss mean: 88.57025146484375
nll mean: 87.63948822021484 	 kl mean: 1.2305424213409424 	 loss mean: 88.87003326416016


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 22.56it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.98it/s][A

nll mean: 87.4183120727539 	 kl mean: 1.2305424213409424 	 loss mean: 88.64885711669922
nll mean: 113.38526153564453 	 kl mean: 0.9276548624038696 	 loss mean: 114.31291198730469
nll mean: 113.24313354492188 	 kl mean: 0.9276548624038696 	 loss mean: 114.17079162597656
nll mean: 113.4071273803711 	 kl mean: 0.9276548624038696 	 loss mean: 114.33477783203125
nll mean: 113.39076232910156 	 kl mean: 0.9276548624038696 	 loss mean: 114.31842041015625


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.98it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.96it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.89it/s][A

nll mean: 113.7987060546875 	 kl mean: 0.9276548624038696 	 loss mean: 114.72636413574219
nll mean: 113.37313079833984 	 kl mean: 0.9276548624038696 	 loss mean: 114.30078125
nll mean: 113.2914810180664 	 kl mean: 0.9276548624038696 	 loss mean: 114.21913146972656
nll mean: 113.27725219726562 	 kl mean: 0.9276548624038696 	 loss mean: 114.20489501953125
nll mean: 113.32304382324219 	 kl mean: 0.9276548624038696 	 loss mean: 114.25068664550781


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.74it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.54it/s][A

nll mean: 113.27345275878906 	 kl mean: 0.9276548624038696 	 loss mean: 114.20111083984375
nll mean: 126.94502258300781 	 kl mean: 1.0393872261047363 	 loss mean: 127.98442077636719
nll mean: 126.818603515625 	 kl mean: 1.0393872261047363 	 loss mean: 127.85798645019531


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 20%|██        | 2/10 [00:00<00:00, 12.54it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A

nll mean: 127.01914978027344 	 kl mean: 1.0393872261047363 	 loss mean: 128.05853271484375
nll mean: 126.6666259765625 	 kl mean: 1.0393872261047363 	 loss mean: 127.70602416992188
nll mean: 127.04039001464844 	 kl mean: 1.0393872261047363 	 loss mean: 128.07977294921875


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 40%|████      | 4/10 [00:00<00:00, 12.52it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A

nll mean: 127.06463623046875 	 kl mean: 1.0393872261047363 	 loss mean: 128.10403442382812
nll mean: 126.73443603515625 	 kl mean: 1.0393872261047363 	 loss mean: 127.77381896972656
nll mean: 126.74588775634766 	 kl mean: 1.0393872261047363 	 loss mean: 127.78528594970703


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.85it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.54it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.46it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.10903930664062 	 kl mean: 1.0393872261047363 	 loss mean: 128.14842224121094
nll mean: 126.7627182006836 	 kl mean: 1.0393872261047363 	 loss mean: 127.8021240234375
nll mean: 65.26873779296875 	 kl mean: 1.5984368324279785 	 loss mean: 66.86717224121094


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.27it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 30%|███       | 3/10 [00:00<00:00, 10.18it/s][A

nll mean: 65.39552307128906 	 kl mean: 1.5984368324279785 	 loss mean: 66.99395751953125
nll mean: 65.55545806884766 	 kl mean: 1.5984368324279785 	 loss mean: 67.15389251708984
nll mean: 65.35122680664062 	 kl mean: 1.5984368324279785 	 loss mean: 66.94966125488281


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 30%|███       | 3/10 [00:00<00:00, 10.18it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.23it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.25it/s][A

nll mean: 65.55583190917969 	 kl mean: 1.5984368324279785 	 loss mean: 67.1542739868164
nll mean: 65.77290344238281 	 kl mean: 1.5984368324279785 	 loss mean: 67.37134552001953
nll mean: 65.47864532470703 	 kl mean: 1.5984368324279785 	 loss mean: 67.07708740234375


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.25it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.17it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.26it/s][A
 79%|███████▉  | 30/38 [00:18<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 65.553955078125 	 kl mean: 1.5984368324279785 	 loss mean: 67.15238952636719
nll mean: 65.47196960449219 	 kl mean: 1.5984368324279785 	 loss mean: 67.07041931152344
nll mean: 65.3207778930664 	 kl mean: 1.5984368324279785 	 loss mean: 66.9192123413086


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 12.93it/s][A

nll mean: 110.06222534179688 	 kl mean: 1.2814726829528809 	 loss mean: 111.34368896484375
nll mean: 110.00972747802734 	 kl mean: 1.2814726829528809 	 loss mean: 111.29119873046875
nll mean: 109.88294982910156 	 kl mean: 1.2814726829528809 	 loss mean: 111.16442108154297


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 12.93it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 12.86it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.93it/s][A

nll mean: 110.04692840576172 	 kl mean: 1.2814726829528809 	 loss mean: 111.32840728759766
nll mean: 109.86177062988281 	 kl mean: 1.2814726829528809 	 loss mean: 111.14324951171875
nll mean: 109.92539978027344 	 kl mean: 1.2814726829528809 	 loss mean: 111.20687866210938


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.93it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.89it/s][A

nll mean: 109.76933288574219 	 kl mean: 1.2814726829528809 	 loss mean: 111.0508041381836
nll mean: 109.91069030761719 	 kl mean: 1.2814726829528809 	 loss mean: 111.19216918945312
nll mean: 110.060546875 	 kl mean: 1.2814726829528809 	 loss mean: 111.34201049804688


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.79it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.98it/s][A

nll mean: 109.89778137207031 	 kl mean: 1.2814726829528809 	 loss mean: 111.17926025390625
nll mean: 141.90675354003906 	 kl mean: 1.145308494567871 	 loss mean: 143.05206298828125


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
 10%|█         | 1/10 [00:00<00:00,  9.98it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 20%|██        | 2/10 [00:00<00:00,  9.97it/s]

nll mean: 142.23887634277344 	 kl mean: 1.145308494567871 	 loss mean: 143.38418579101562
nll mean: 142.05218505859375 	 kl mean: 1.145308494567871 	 loss mean: 143.197509765625
nll mean: 142.0501708984375 	 kl mean: 1.145308494567871 	 loss mean: 143.19546508789062


[A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 40%|████      | 4/10 [00:00<00:00,  9.99it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.97it/s][A

nll mean: 142.03033447265625 	 kl mean: 1.145308494567871 	 loss mean: 143.17564392089844
nll mean: 142.02871704101562 	 kl mean: 1.145308494567871 	 loss mean: 143.1740264892578


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.97it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.93it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A

nll mean: 142.092041015625 	 kl mean: 1.145308494567871 	 loss mean: 143.23736572265625
nll mean: 142.0497283935547 	 kl mean: 1.145308494567871 	 loss mean: 143.1950225830078


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.83it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.88it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 142.04550170898438 	 kl mean: 1.145308494567871 	 loss mean: 143.1907958984375
nll mean: 141.9906005859375 	 kl mean: 1.145308494567871 	 loss mean: 143.13592529296875
nll mean: 66.927734375 	 kl mean: 1.4911516904830933 	 loss mean: 68.41889190673828
nll mean: 66.6821517944336 	 kl mean: 1.4911516904830933 	 loss mean: 68.17329406738281


                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 25.95it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.84it/s][A

nll mean: 66.61595153808594 	 kl mean: 1.4911516904830933 	 loss mean: 68.10710144042969
nll mean: 66.6278076171875 	 kl mean: 1.4911516904830933 	 loss mean: 68.11895751953125
nll mean: 66.72288513183594 	 kl mean: 1.4911516904830933 	 loss mean: 68.21404266357422
nll mean: 66.67709350585938 	 kl mean: 1.4911516904830933 	 loss mean: 68.16825103759766
nll mean: 66.58103942871094 	 kl mean: 1.4911516904830933 	 loss mean: 68.07218933105469
nll mean: 66.954345703125 	 kl mean: 1.4911516904830933 	 loss mean: 68.44549560546875


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.84it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
100%|██████████| 10/10 [00:00<00:00, 25.51it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 21.64it/s][A

nll mean: 66.69487762451172 	 kl mean: 1.4911516904830933 	 loss mean: 68.18603515625
nll mean: 66.66853332519531 	 kl mean: 1.4911516904830933 	 loss mean: 68.15968322753906
nll mean: 124.4574203491211 	 kl mean: 1.0236690044403076 	 loss mean: 125.48109436035156
nll mean: 124.60706329345703 	 kl mean: 1.0236690044403076 	 loss mean: 125.6307373046875
nll mean: 124.5958251953125 	 kl mean: 1.0236690044403076 	 loss mean: 125.61949157714844


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 21.64it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.27it/s][A

nll mean: 124.48735046386719 	 kl mean: 1.0236690044403076 	 loss mean: 125.51102447509766
nll mean: 124.47068786621094 	 kl mean: 1.0236690044403076 	 loss mean: 125.49435424804688
nll mean: 124.42253112792969 	 kl mean: 1.0236690044403076 	 loss mean: 125.44620513916016
nll mean: 124.56077575683594 	 kl mean: 1.0236690044403076 	 loss mean: 125.5844497680664
nll mean: 124.39833068847656 	 kl mean: 1.0236690044403076 	 loss mean: 125.4219970703125


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.27it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
100%|██████████| 10/10 [00:00<00:00, 21.01it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.42047119140625 	 kl mean: 1.0236690044403076 	 loss mean: 125.44413757324219
nll mean: 124.63204956054688 	 kl mean: 1.0236690044403076 	 loss mean: 125.65573120117188
nll mean: 125.36015319824219 	 kl mean: 1.1632795333862305 	 loss mean: 126.5234375


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.29it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.37it/s][A

nll mean: 125.61780548095703 	 kl mean: 1.1632795333862305 	 loss mean: 126.78108215332031
nll mean: 125.40855407714844 	 kl mean: 1.1632795333862305 	 loss mean: 126.57183074951172
nll mean: 125.55011749267578 	 kl mean: 1.1632795333862305 	 loss mean: 126.7134017944336


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 12.37it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.40it/s][A

nll mean: 125.4066162109375 	 kl mean: 1.1632795333862305 	 loss mean: 126.56990051269531
nll mean: 125.34754943847656 	 kl mean: 1.1632795333862305 	 loss mean: 126.51083374023438
nll mean: 125.62600708007812 	 kl mean: 1.1632795333862305 	 loss mean: 126.78927612304688


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.40it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.61701965332031 	 kl mean: 1.1632795333862305 	 loss mean: 126.7802963256836
nll mean: 125.1318359375 	 kl mean: 1.1632795333862305 	 loss mean: 126.29512023925781
nll mean: 125.33634948730469 	 kl mean: 1.1632795333862305 	 loss mean: 126.4996337890625


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.64it/s][A

nll mean: 118.4268569946289 	 kl mean: 1.160081386566162 	 loss mean: 119.58694458007812
nll mean: 118.36810302734375 	 kl mean: 1.160081386566162 	 loss mean: 119.52818298339844
nll mean: 118.58958435058594 	 kl mean: 1.160081386566162 	 loss mean: 119.7496566772461


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.64it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.62it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.62it/s][A

nll mean: 118.4809341430664 	 kl mean: 1.160081386566162 	 loss mean: 119.64102172851562
nll mean: 118.3414306640625 	 kl mean: 1.160081386566162 	 loss mean: 119.50151824951172
nll mean: 118.51244354248047 	 kl mean: 1.160081386566162 	 loss mean: 119.67253112792969


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.62it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.61it/s][A

nll mean: 118.4033203125 	 kl mean: 1.160081386566162 	 loss mean: 119.56340026855469
nll mean: 118.64651489257812 	 kl mean: 1.160081386566162 	 loss mean: 119.80659484863281
nll mean: 118.38521575927734 	 kl mean: 1.160081386566162 	 loss mean: 119.54530334472656


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.61it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.71it/s][A

nll mean: 118.5654296875 	 kl mean: 1.160081386566162 	 loss mean: 119.72550964355469
nll mean: 117.40156555175781 	 kl mean: 1.0752837657928467 	 loss mean: 118.47685241699219
nll mean: 117.20748901367188 	 kl mean: 1.0752837657928467 	 loss mean: 118.28276824951172
nll mean: 117.38115692138672 	 kl mean: 1.0752837657928467 	 loss mean: 118.45643615722656
nll mean: 117.52082061767578 	 kl mean: 1.0752837657928467 	 loss mean: 118.59610748291016


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.71it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.66it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.54it/s][A

nll mean: 117.45297241210938 	 kl mean: 1.0752837657928467 	 loss mean: 118.52825927734375
nll mean: 117.33679962158203 	 kl mean: 1.0752837657928467 	 loss mean: 118.41207885742188
nll mean: 117.55775451660156 	 kl mean: 1.0752837657928467 	 loss mean: 118.63304138183594
nll mean: 117.32235717773438 	 kl mean: 1.0752837657928467 	 loss mean: 118.39764404296875
nll mean: 117.452880859375 	 kl mean: 1.0752837657928467 	 loss mean: 118.52816009521484


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 21.69it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.60it/s][A

nll mean: 117.24485778808594 	 kl mean: 1.0752837657928467 	 loss mean: 118.32014465332031
nll mean: 89.43209075927734 	 kl mean: 1.7217345237731934 	 loss mean: 91.1538314819336
nll mean: 89.44764709472656 	 kl mean: 1.7217345237731934 	 loss mean: 91.16937255859375
nll mean: 89.0810775756836 	 kl mean: 1.7217345237731934 	 loss mean: 90.80281066894531
nll mean: 89.25679016113281 	 kl mean: 1.7217345237731934 	 loss mean: 90.978515625
nll mean: 89.63554382324219 	 kl mean: 1.7217345237731934 	 loss mean: 91.35728454589844
nll mean: 89.611328125 	 kl mean: 1.7217345237731934 	 loss mean: 91.33306884765625


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.60it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
100%|██████████| 10/10 [00:00<00:00, 30.51it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 89.55208587646484 	 kl mean: 1.7217345237731934 	 loss mean: 91.2738265991211
nll mean: 89.22113037109375 	 kl mean: 1.7217345237731934 	 loss mean: 90.94286346435547
nll mean: 89.34355163574219 	 kl mean: 1.7217345237731934 	 loss mean: 91.06526947021484
nll mean: 89.31558227539062 	 kl mean: 1.7217345237731934 	 loss mean: 91.03731536865234
Approximate NLL:
tensor(126.9019, device='cuda:0')
Approximate KL:
tensor(1.1597, device='cuda:0')
Testing took 0:00:25.164946


In [13]:
# Print the list of approximate NLL values stored in `wd_nlls` (one tensor per
# evaluated checkpoint, as the output below shows).
# NOTE(review): `wd_nlls` is presumably filled by get_approx_nlls() in an
# earlier cell that is not visible from here -- confirm before re-running.
print(wd_nlls)

[tensor(126.3611, device='cuda:0'), tensor(127.2960, device='cuda:0'), tensor(126.4909, device='cuda:0'), tensor(126.9019, device='cuda:0')]


# Free Bits

In [14]:
# Look up the saved checkpoint of the 'freebits_05' experiment in each of the
# four results_final/results{i} run directories (the helper takes the first
# entry found in every models/ folder).
saved_model_files = get_model_filenames(experiment_name='freebits_05')
# Bare last expression: echo the resolved paths as the cell output.
saved_model_files

['results_final/results0/freebits_05/models/sentence_vae_FreeBits_0.5_3500.pt',
 'results_final/results1/freebits_05/models/sentence_vae_FreeBits_0.5_3500.pt',
 'results_final/results2/freebits_05/models/sentence_vae_FreeBits_0.5_3500.pt',
 'results_final/results3/freebits_05/models/sentence_vae_FreeBits_0.5_3500.pt']

In [15]:
# Evaluate every 'freebits_05' checkpoint listed in `saved_model_files`;
# get_approx_nlls returns two parallel lists (NLL estimates, KL estimates),
# one entry per checkpoint file.
fb_nlls, fb_kls = get_approx_nlls(saved_model_files=saved_model_files)

  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .05it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .05it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .05it/s][A
                                              

nll mean: 108.69758605957031 	 kl mean: 8.921194076538086 	 loss mean: 117.6187744140625
nll mean: 108.10222625732422 	 kl mean: 8.921194076538086 	 loss mean: 117.02342224121094
nll mean: 108.7293701171875 	 kl mean: 8.921194076538086 	 loss mean: 117.65055847167969
nll mean: 108.33524322509766 	 kl mean: 8.921194076538086 	 loss mean: 117.25643920898438
nll mean: 108.25239562988281 	 kl mean: 8.921194076538086 	 loss mean: 117.17359161376953


  0%|          | 0/38 [00:00<?, ?it/s]
 30%|███       | 3/10 [00:00<00:00, 26.05it/s][A
                                      .70it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .70it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .70it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.70it/s][A
                                      .47it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.19it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.6400375366211 	 kl mean: 8.921194076538086 	 loss mean: 117.56123352050781
nll mean: 108.73342895507812 	 kl mean: 8.921194076538086 	 loss mean: 117.65461730957031
nll mean: 108.94733428955078 	 kl mean: 8.921194076538086 	 loss mean: 117.8685302734375
nll mean: 108.64723205566406 	 kl mean: 8.921194076538086 	 loss mean: 117.56842041015625
nll mean: 108.52285766601562 	 kl mean: 8.921194076538086 	 loss mean: 117.44406127929688


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 20%|██        | 2/10 [00:00<00:00, 14.27it/s][A

nll mean: 127.15644836425781 	 kl mean: 8.558151245117188 	 loss mean: 135.714599609375
nll mean: 126.66825866699219 	 kl mean: 8.558151245117188 	 loss mean: 135.22640991210938
nll mean: 126.65693664550781 	 kl mean: 8.558151245117188 	 loss mean: 135.215087890625


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 20%|██        | 2/10 [00:00<00:00, 14.27it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 40%|████      | 4/10 [00:00<00:00, 14.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.24it/s][A

nll mean: 127.0471420288086 	 kl mean: 8.558151245117188 	 loss mean: 135.60528564453125
nll mean: 126.56863403320312 	 kl mean: 8.558151245117188 	 loss mean: 135.1267852783203
nll mean: 126.77742004394531 	 kl mean: 8.558151245117188 	 loss mean: 135.3355712890625


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.24it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.03it/s][A

nll mean: 127.11512756347656 	 kl mean: 8.558151245117188 	 loss mean: 135.67327880859375
nll mean: 126.91659545898438 	 kl mean: 8.558151245117188 	 loss mean: 135.47474670410156
nll mean: 126.74684143066406 	 kl mean: 8.558151245117188 	 loss mean: 135.30499267578125


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.51it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.03it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.10it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 25.32it/s][A

nll mean: 126.50241088867188 	 kl mean: 8.558151245117188 	 loss mean: 135.06056213378906
nll mean: 98.19339752197266 	 kl mean: 8.06130599975586 	 loss mean: 106.25470733642578
nll mean: 98.30307006835938 	 kl mean: 8.06130599975586 	 loss mean: 106.3643798828125
nll mean: 98.08570861816406 	 kl mean: 8.06130599975586 	 loss mean: 106.14700317382812
nll mean: 98.20149230957031 	 kl mean: 8.06130599975586 	 loss mean: 106.26280212402344


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 25.32it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.02it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.01it/s][A

nll mean: 98.39924621582031 	 kl mean: 8.06130599975586 	 loss mean: 106.46055603027344
nll mean: 98.22097778320312 	 kl mean: 8.06130599975586 	 loss mean: 106.28228759765625
nll mean: 98.1585693359375 	 kl mean: 8.06130599975586 	 loss mean: 106.21987915039062
nll mean: 98.41944885253906 	 kl mean: 8.06130599975586 	 loss mean: 106.48075866699219
nll mean: 97.99172973632812 	 kl mean: 8.06130599975586 	 loss mean: 106.05303955078125


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
100%|██████████| 10/10 [00:00<00:00, 24.89it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.90it/s][A

nll mean: 97.9775390625 	 kl mean: 8.06130599975586 	 loss mean: 106.03884887695312
nll mean: 138.37660217285156 	 kl mean: 8.377578735351562 	 loss mean: 146.75418090820312
nll mean: 138.55789184570312 	 kl mean: 8.377578735351562 	 loss mean: 146.93545532226562


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
 20%|██        | 2/10 [00:00<00:00, 10.90it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
 40%|████      | 4/10 [00:00<00:00, 10.90it/s][A

nll mean: 138.7311248779297 	 kl mean: 8.377578735351562 	 loss mean: 147.10870361328125
nll mean: 138.37094116210938 	 kl mean: 8.377578735351562 	 loss mean: 146.74850463867188
nll mean: 138.03158569335938 	 kl mean: 8.377578735351562 	 loss mean: 146.4091796875


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 40%|████      | 4/10 [00:00<00:00, 10.90it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.87it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.87it/s][A

nll mean: 138.41244506835938 	 kl mean: 8.377578735351562 	 loss mean: 146.7900390625
nll mean: 138.62611389160156 	 kl mean: 8.377578735351562 	 loss mean: 147.00369262695312
nll mean: 138.38140869140625 	 kl mean: 8.377578735351562 	 loss mean: 146.7589874267578


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.86it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.46241760253906 	 kl mean: 8.377578735351562 	 loss mean: 146.83999633789062
nll mean: 138.40777587890625 	 kl mean: 8.377578735351562 	 loss mean: 146.78533935546875
nll mean: 125.15715026855469 	 kl mean: 8.027483940124512 	 loss mean: 133.18463134765625


                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 13.90it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.99it/s][A

nll mean: 125.14726257324219 	 kl mean: 8.027483940124512 	 loss mean: 133.17474365234375
nll mean: 124.70587158203125 	 kl mean: 8.027483940124512 	 loss mean: 132.7333526611328
nll mean: 124.94406127929688 	 kl mean: 8.027483940124512 	 loss mean: 132.97154235839844


                                              
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 13.99it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.12it/s][A

nll mean: 124.91390991210938 	 kl mean: 8.027483940124512 	 loss mean: 132.94139099121094
nll mean: 125.1506576538086 	 kl mean: 8.027483940124512 	 loss mean: 133.1781463623047
nll mean: 125.39730834960938 	 kl mean: 8.027483940124512 	 loss mean: 133.4248046875


                                              
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.12it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.17it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.16it/s][A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.61593627929688 	 kl mean: 8.027483940124512 	 loss mean: 132.64341735839844
nll mean: 124.7744140625 	 kl mean: 8.027483940124512 	 loss mean: 132.80189514160156
nll mean: 125.06221008300781 	 kl mean: 8.027483940124512 	 loss mean: 133.08969116210938


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.59it/s][A

nll mean: 122.45164489746094 	 kl mean: 8.247314453125 	 loss mean: 130.69895935058594
nll mean: 122.41213989257812 	 kl mean: 8.247314453125 	 loss mean: 130.65945434570312
nll mean: 122.826171875 	 kl mean: 8.247314453125 	 loss mean: 131.073486328125


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.59it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 14.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.23it/s][A

nll mean: 123.00331115722656 	 kl mean: 8.247314453125 	 loss mean: 131.25064086914062
nll mean: 122.42304229736328 	 kl mean: 8.247314453125 	 loss mean: 130.67034912109375
nll mean: 122.58777618408203 	 kl mean: 8.247314453125 	 loss mean: 130.8350830078125


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.23it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.26it/s][A

nll mean: 121.91326904296875 	 kl mean: 8.247314453125 	 loss mean: 130.16058349609375
nll mean: 122.31292724609375 	 kl mean: 8.247314453125 	 loss mean: 130.56024169921875
nll mean: 122.51364135742188 	 kl mean: 8.247314453125 	 loss mean: 130.76095581054688


                                              
 13%|█▎        | 5/38 [00:03<00:20,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.26it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.18it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.40it/s][A

nll mean: 122.58440399169922 	 kl mean: 8.247314453125 	 loss mean: 130.8317108154297
nll mean: 133.1619415283203 	 kl mean: 7.908991813659668 	 loss mean: 141.0709228515625
nll mean: 133.1957244873047 	 kl mean: 7.908991813659668 	 loss mean: 141.10470581054688
nll mean: 133.5667266845703 	 kl mean: 7.908991813659668 	 loss mean: 141.4757080078125
nll mean: 133.0059814453125 	 kl mean: 7.908991813659668 	 loss mean: 140.9149627685547


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.40it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.22it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.03it/s][A

nll mean: 132.77574157714844 	 kl mean: 7.908991813659668 	 loss mean: 140.68472290039062
nll mean: 133.28289794921875 	 kl mean: 7.908991813659668 	 loss mean: 141.19189453125
nll mean: 133.111572265625 	 kl mean: 7.908991813659668 	 loss mean: 141.02056884765625
nll mean: 132.9473876953125 	 kl mean: 7.908991813659668 	 loss mean: 140.85638427734375
nll mean: 133.07740783691406 	 kl mean: 7.908991813659668 	 loss mean: 140.98641967773438


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 24.87it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.13it/s][A

nll mean: 133.44366455078125 	 kl mean: 7.908991813659668 	 loss mean: 141.3526611328125
nll mean: 104.66587829589844 	 kl mean: 7.941777229309082 	 loss mean: 112.60765075683594
nll mean: 104.9539566040039 	 kl mean: 7.941777229309082 	 loss mean: 112.8957290649414
nll mean: 105.04603576660156 	 kl mean: 7.941777229309082 	 loss mean: 112.98780822753906
nll mean: 105.36015319824219 	 kl mean: 7.941777229309082 	 loss mean: 113.30192565917969


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.13it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.99it/s][A
                                              [A


nll mean: 104.60580444335938 	 kl mean: 7.941777229309082 	 loss mean: 112.5475845336914
nll mean: 104.77484893798828 	 kl mean: 7.941777229309082 	 loss mean: 112.71662902832031
nll mean: 104.95291137695312 	 kl mean: 7.941777229309082 	 loss mean: 112.89468383789062
nll mean: 104.8549575805664 	 kl mean: 7.941777229309082 	 loss mean: 112.7967300415039
nll mean: 104.86433410644531 	 kl mean: 7.941777229309082 	 loss mean: 112.80610656738281


 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 24.85it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.39it/s][A

nll mean: 105.5779037475586 	 kl mean: 7.941777229309082 	 loss mean: 113.5196762084961
nll mean: 130.7199249267578 	 kl mean: 8.397895812988281 	 loss mean: 139.11781311035156
nll mean: 131.11129760742188 	 kl mean: 8.397895812988281 	 loss mean: 139.50918579101562


                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
 20%|██        | 2/10 [00:00<00:00, 14.39it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 40%|████      | 4/10 [00:00<00:00, 14.43it/s][A

nll mean: 131.48654174804688 	 kl mean: 8.397895812988281 	 loss mean: 139.88442993164062
nll mean: 131.46778869628906 	 kl mean: 8.397895812988281 	 loss mean: 139.86569213867188
nll mean: 130.89419555664062 	 kl mean: 8.397895812988281 	 loss mean: 139.29208374023438


                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 40%|████      | 4/10 [00:00<00:00, 14.43it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.38it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.87it/s][A

nll mean: 131.5037841796875 	 kl mean: 8.397895812988281 	 loss mean: 139.9016876220703
nll mean: 131.3963623046875 	 kl mean: 8.397895812988281 	 loss mean: 139.79425048828125
nll mean: 131.14865112304688 	 kl mean: 8.397895812988281 	 loss mean: 139.5465545654297
nll mean: 131.1730499267578 	 kl mean: 8.397895812988281 	 loss mean: 139.57093811035156


                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.79it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.32it/s][A

nll mean: 131.04428100585938 	 kl mean: 8.397895812988281 	 loss mean: 139.44216918945312
nll mean: 130.9053955078125 	 kl mean: 8.420339584350586 	 loss mean: 139.3257293701172
nll mean: 131.01760864257812 	 kl mean: 8.420339584350586 	 loss mean: 139.43795776367188
nll mean: 130.74070739746094 	 kl mean: 8.420339584350586 	 loss mean: 139.16104125976562
nll mean: 131.00018310546875 	 kl mean: 8.420339584350586 	 loss mean: 139.4205322265625


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.32it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.13it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.94it/s][A

nll mean: 130.50279235839844 	 kl mean: 8.420339584350586 	 loss mean: 138.92312622070312
nll mean: 130.6647186279297 	 kl mean: 8.420339584350586 	 loss mean: 139.08505249023438
nll mean: 131.25009155273438 	 kl mean: 8.420339584350586 	 loss mean: 139.67041015625
nll mean: 131.33311462402344 	 kl mean: 8.420339584350586 	 loss mean: 139.75344848632812
nll mean: 131.1464385986328 	 kl mean: 8.420339584350586 	 loss mean: 139.5667724609375


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.67it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
 30%|███       | 3/10 [00:00<00:00, 25.22it/s][A

nll mean: 131.33016967773438 	 kl mean: 8.420339584350586 	 loss mean: 139.75048828125
nll mean: 117.9050064086914 	 kl mean: 8.206375122070312 	 loss mean: 126.11137390136719
nll mean: 117.33085632324219 	 kl mean: 8.206375122070312 	 loss mean: 125.5372314453125
nll mean: 117.33203125 	 kl mean: 8.206375122070312 	 loss mean: 125.53842163085938
nll mean: 117.76263427734375 	 kl mean: 8.206375122070312 	 loss mean: 125.96900177001953


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
 30%|███       | 3/10 [00:00<00:00, 25.22it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.97it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.78it/s][A

nll mean: 117.34320068359375 	 kl mean: 8.206375122070312 	 loss mean: 125.54956817626953
nll mean: 117.47578430175781 	 kl mean: 8.206375122070312 	 loss mean: 125.68216705322266
nll mean: 117.80684661865234 	 kl mean: 8.206375122070312 	 loss mean: 126.01322937011719
nll mean: 117.62374877929688 	 kl mean: 8.206375122070312 	 loss mean: 125.83011627197266
nll mean: 116.96908569335938 	 kl mean: 8.206375122070312 	 loss mean: 125.17546844482422


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
100%|██████████| 10/10 [00:00<00:00, 24.67it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 21.16it/s][A

nll mean: 117.38957214355469 	 kl mean: 8.206375122070312 	 loss mean: 125.59593963623047
nll mean: 140.95443725585938 	 kl mean: 8.185078620910645 	 loss mean: 149.1395263671875
nll mean: 141.0703125 	 kl mean: 8.185078620910645 	 loss mean: 149.25540161132812
nll mean: 140.61839294433594 	 kl mean: 8.185078620910645 	 loss mean: 148.803466796875
nll mean: 141.51644897460938 	 kl mean: 8.185078620910645 	 loss mean: 149.7015380859375


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 21.16it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.19it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.15it/s][A

nll mean: 140.87319946289062 	 kl mean: 8.185078620910645 	 loss mean: 149.05828857421875
nll mean: 141.02130126953125 	 kl mean: 8.185078620910645 	 loss mean: 149.2063751220703
nll mean: 141.19061279296875 	 kl mean: 8.185078620910645 	 loss mean: 149.37570190429688
nll mean: 140.65484619140625 	 kl mean: 8.185078620910645 	 loss mean: 148.8399200439453
nll mean: 141.09432983398438 	 kl mean: 8.185078620910645 	 loss mean: 149.27938842773438


                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
100%|██████████| 10/10 [00:00<00:00, 21.22it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.38it/s][A

nll mean: 140.62496948242188 	 kl mean: 8.185078620910645 	 loss mean: 148.81005859375
nll mean: 120.22721862792969 	 kl mean: 8.487061500549316 	 loss mean: 128.7142791748047
nll mean: 119.9439468383789 	 kl mean: 8.487061500549316 	 loss mean: 128.43099975585938


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 20%|██        | 2/10 [00:00<00:00, 12.38it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 40%|████      | 4/10 [00:00<00:00, 12.36it/s][A

nll mean: 119.95228576660156 	 kl mean: 8.487061500549316 	 loss mean: 128.43934631347656
nll mean: 119.8465576171875 	 kl mean: 8.487061500549316 	 loss mean: 128.3336181640625
nll mean: 119.85613250732422 	 kl mean: 8.487061500549316 	 loss mean: 128.34320068359375


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 40%|████      | 4/10 [00:00<00:00, 12.36it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.32it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.40it/s][A

nll mean: 119.70272827148438 	 kl mean: 8.487061500549316 	 loss mean: 128.18978881835938
nll mean: 120.02326965332031 	 kl mean: 8.487061500549316 	 loss mean: 128.5103302001953
nll mean: 120.02336120605469 	 kl mean: 8.487061500549316 	 loss mean: 128.51043701171875


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.641845703125 	 kl mean: 8.487061500549316 	 loss mean: 129.12890625
nll mean: 119.76251220703125 	 kl mean: 8.487061500549316 	 loss mean: 128.24957275390625
nll mean: 160.75607299804688 	 kl mean: 8.778806686401367 	 loss mean: 169.53488159179688


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 10.02it/s][A
                                               [A
[A                                           

nll mean: 160.71343994140625 	 kl mean: 8.778806686401367 	 loss mean: 169.49224853515625
nll mean: 161.16067504882812 	 kl mean: 8.778806686401367 	 loss mean: 169.93948364257812


 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00,  9.99it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.06it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.13it/s][A

nll mean: 161.02957153320312 	 kl mean: 8.778806686401367 	 loss mean: 169.80838012695312
nll mean: 161.78564453125 	 kl mean: 8.778806686401367 	 loss mean: 170.564453125
nll mean: 161.1767120361328 	 kl mean: 8.778806686401367 	 loss mean: 169.95553588867188
nll mean: 161.1980743408203 	 kl mean: 8.778806686401367 	 loss mean: 169.97686767578125


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.13it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 90%|█████████ | 9/10 [00:00<00:00, 10.10it/s][A

nll mean: 161.30364990234375 	 kl mean: 8.778806686401367 	 loss mean: 170.08245849609375
nll mean: 160.82412719726562 	 kl mean: 8.778806686401367 	 loss mean: 169.60293579101562
nll mean: 161.45645141601562 	 kl mean: 8.778806686401367 	 loss mean: 170.23524475097656


100%|██████████| 10/10 [00:00<00:00, 10.11it/s]
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.08it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.00it/s][A

nll mean: 134.62921142578125 	 kl mean: 8.041875839233398 	 loss mean: 142.67108154296875
nll mean: 134.96421813964844 	 kl mean: 8.041875839233398 	 loss mean: 143.00608825683594
nll mean: 134.57244873046875 	 kl mean: 8.041875839233398 	 loss mean: 142.61431884765625
nll mean: 134.087158203125 	 kl mean: 8.041875839233398 	 loss mean: 142.12904357910156


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
 40%|████      | 4/10 [00:00<00:00, 18.00it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.89it/s][A
 80%|████████  | 8/10 [00:00<00:00, 17.83it/s][A

nll mean: 134.854248046875 	 kl mean: 8.041875839233398 	 loss mean: 142.8961181640625
nll mean: 134.98158264160156 	 kl mean: 8.041875839233398 	 loss mean: 143.02346801757812
nll mean: 134.463623046875 	 kl mean: 8.041875839233398 	 loss mean: 142.5054931640625
nll mean: 134.52459716796875 	 kl mean: 8.041875839233398 	 loss mean: 142.56646728515625


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.41it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.83it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 134.56060791015625 	 kl mean: 8.041875839233398 	 loss mean: 142.60247802734375
nll mean: 134.75787353515625 	 kl mean: 8.041875839233398 	 loss mean: 142.79974365234375
nll mean: 141.98255920410156 	 kl mean: 8.394887924194336 	 loss mean: 150.37744140625


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.81it/s][A

nll mean: 142.53167724609375 	 kl mean: 8.394887924194336 	 loss mean: 150.92657470703125
nll mean: 142.32559204101562 	 kl mean: 8.394887924194336 	 loss mean: 150.72048950195312
nll mean: 142.236328125 	 kl mean: 8.394887924194336 	 loss mean: 150.6312255859375


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.81it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A

nll mean: 142.57662963867188 	 kl mean: 8.394887924194336 	 loss mean: 150.9715118408203
nll mean: 142.4931640625 	 kl mean: 8.394887924194336 	 loss mean: 150.88803100585938
nll mean: 142.21701049804688 	 kl mean: 8.394887924194336 	 loss mean: 150.61190795898438


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.79it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.77it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 142.4741668701172 	 kl mean: 8.394887924194336 	 loss mean: 150.86904907226562
nll mean: 142.22872924804688 	 kl mean: 8.394887924194336 	 loss mean: 150.6236114501953
nll mean: 142.15115356445312 	 kl mean: 8.394887924194336 	 loss mean: 150.54605102539062


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A

nll mean: 143.51206970214844 	 kl mean: 7.892433166503906 	 loss mean: 151.40451049804688
nll mean: 143.6522216796875 	 kl mean: 7.892433166503906 	 loss mean: 151.544677734375
nll mean: 144.00262451171875 	 kl mean: 7.892433166503906 	 loss mean: 151.89505004882812
nll mean: 143.67306518554688 	 kl mean: 7.892433166503906 	 loss mean: 151.56549072265625
nll mean: 144.14004516601562 	 kl mean: 7.892433166503906 	 loss mean: 152.032470703125


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.55it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
100%|██████████| 10/10 [00:00<00:00, 23.98it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.19265747070312 	 kl mean: 7.892433166503906 	 loss mean: 152.0850830078125
nll mean: 143.4174346923828 	 kl mean: 7.892433166503906 	 loss mean: 151.30987548828125
nll mean: 143.99949645996094 	 kl mean: 7.892433166503906 	 loss mean: 151.89193725585938
nll mean: 143.6192169189453 	 kl mean: 7.892433166503906 	 loss mean: 151.51165771484375
nll mean: 143.48065185546875 	 kl mean: 7.892433166503906 	 loss mean: 151.37310791015625


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.03it/s][A

nll mean: 132.12539672851562 	 kl mean: 8.257061958312988 	 loss mean: 140.38247680664062
nll mean: 132.2952423095703 	 kl mean: 8.257061958312988 	 loss mean: 140.55230712890625
nll mean: 132.43548583984375 	 kl mean: 8.257061958312988 	 loss mean: 140.6925506591797
nll mean: 132.2950439453125 	 kl mean: 8.257061958312988 	 loss mean: 140.55209350585938
nll mean: 132.890869140625 	 kl mean: 8.257061958312988 	 loss mean: 141.14793395996094


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.03it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.94it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 24.75it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.3592529296875 	 kl mean: 8.257061958312988 	 loss mean: 140.61631774902344
nll mean: 132.453857421875 	 kl mean: 8.257061958312988 	 loss mean: 140.71090698242188
nll mean: 132.31771850585938 	 kl mean: 8.257061958312988 	 loss mean: 140.57479858398438
nll mean: 132.1477813720703 	 kl mean: 8.257061958312988 	 loss mean: 140.40484619140625
nll mean: 132.40805053710938 	 kl mean: 8.257061958312988 	 loss mean: 140.6651153564453


                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A

nll mean: 130.55526733398438 	 kl mean: 8.66995620727539 	 loss mean: 139.2252197265625
nll mean: 130.06829833984375 	 kl mean: 8.66995620727539 	 loss mean: 138.73825073242188
nll mean: 129.87001037597656 	 kl mean: 8.66995620727539 	 loss mean: 138.5399627685547


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A

nll mean: 130.32785034179688 	 kl mean: 8.66995620727539 	 loss mean: 138.99781799316406
nll mean: 130.07159423828125 	 kl mean: 8.66995620727539 	 loss mean: 138.74154663085938
nll mean: 130.03662109375 	 kl mean: 8.66995620727539 	 loss mean: 138.70657348632812


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A

nll mean: 130.02684020996094 	 kl mean: 8.66995620727539 	 loss mean: 138.69679260253906
nll mean: 130.42318725585938 	 kl mean: 8.66995620727539 	 loss mean: 139.0931396484375
nll mean: 130.07861328125 	 kl mean: 8.66995620727539 	 loss mean: 138.74856567382812


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.56it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.73it/s][A

nll mean: 129.3554229736328 	 kl mean: 8.66995620727539 	 loss mean: 138.025390625
nll mean: 148.2904052734375 	 kl mean: 8.257479667663574 	 loss mean: 156.54788208007812
nll mean: 148.68577575683594 	 kl mean: 8.257479667663574 	 loss mean: 156.9432373046875


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 12.73it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 12.73it/s][A

nll mean: 147.79928588867188 	 kl mean: 8.257479667663574 	 loss mean: 156.05679321289062
nll mean: 148.27804565429688 	 kl mean: 8.257479667663574 	 loss mean: 156.53550720214844
nll mean: 148.68765258789062 	 kl mean: 8.257479667663574 	 loss mean: 156.9451141357422


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 12.73it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.74it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A

nll mean: 148.68875122070312 	 kl mean: 8.257479667663574 	 loss mean: 156.94622802734375
nll mean: 147.91795349121094 	 kl mean: 8.257479667663574 	 loss mean: 156.17543029785156
nll mean: 148.57464599609375 	 kl mean: 8.257479667663574 	 loss mean: 156.83212280273438


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.69it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 148.69589233398438 	 kl mean: 8.257479667663574 	 loss mean: 156.953369140625
nll mean: 148.83180236816406 	 kl mean: 8.257479667663574 	 loss mean: 157.0892791748047
nll mean: 155.56640625 	 kl mean: 8.263922691345215 	 loss mean: 163.830322265625


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.81it/s][A

nll mean: 155.42593383789062 	 kl mean: 8.263922691345215 	 loss mean: 163.68984985351562
nll mean: 156.14480590820312 	 kl mean: 8.263922691345215 	 loss mean: 164.40872192382812
nll mean: 155.5760498046875 	 kl mean: 8.263922691345215 	 loss mean: 163.8399658203125


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 12.81it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A

nll mean: 155.45159912109375 	 kl mean: 8.263922691345215 	 loss mean: 163.71551513671875
nll mean: 155.3670654296875 	 kl mean: 8.263922691345215 	 loss mean: 163.6309814453125
nll mean: 156.0257568359375 	 kl mean: 8.263922691345215 	 loss mean: 164.2896728515625


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.69it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 155.2890625 	 kl mean: 8.263922691345215 	 loss mean: 163.552978515625
nll mean: 155.7772216796875 	 kl mean: 8.263922691345215 	 loss mean: 164.0411376953125
nll mean: 156.01315307617188 	 kl mean: 8.263922691345215 	 loss mean: 164.27706909179688


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.29it/s][A

nll mean: 117.81245422363281 	 kl mean: 8.514453887939453 	 loss mean: 126.32691192626953
nll mean: 117.46443176269531 	 kl mean: 8.514453887939453 	 loss mean: 125.9788818359375
nll mean: 117.6136703491211 	 kl mean: 8.514453887939453 	 loss mean: 126.12812805175781


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.29it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 10.29it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.26it/s][A

nll mean: 117.67825317382812 	 kl mean: 8.514453887939453 	 loss mean: 126.19270324707031
nll mean: 116.79191589355469 	 kl mean: 8.514453887939453 	 loss mean: 125.3063735961914
nll mean: 117.17623138427734 	 kl mean: 8.514453887939453 	 loss mean: 125.690673828125


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.26it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.24it/s][A

nll mean: 117.5704345703125 	 kl mean: 8.514453887939453 	 loss mean: 126.08488464355469
nll mean: 117.71817016601562 	 kl mean: 8.514453887939453 	 loss mean: 126.23262786865234
nll mean: 118.47090148925781 	 kl mean: 8.514453887939453 	 loss mean: 126.98535919189453


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.24it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.24it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.18it/s][A

nll mean: 117.57926177978516 	 kl mean: 8.514453887939453 	 loss mean: 126.09371948242188
nll mean: 106.79693603515625 	 kl mean: 7.458414554595947 	 loss mean: 114.2553482055664
nll mean: 106.24984741210938 	 kl mean: 7.458414554595947 	 loss mean: 113.70826721191406
nll mean: 106.28861999511719 	 kl mean: 7.458414554595947 	 loss mean: 113.74703216552734
nll mean: 106.3034439086914 	 kl mean: 7.458414554595947 	 loss mean: 113.76185607910156
nll mean: 106.16970825195312 	 kl mean: 7.458414554595947 	 loss mean: 113.62811279296875
nll mean: 106.2183609008789 	 kl mean: 7.458414554595947 	 loss mean: 113.67677307128906


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.18it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
100%|██████████| 10/10 [00:00<00:00, 32.90it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.93122100830078 	 kl mean: 7.458414554595947 	 loss mean: 113.38963317871094
nll mean: 106.08504486083984 	 kl mean: 7.458414554595947 	 loss mean: 113.54346466064453
nll mean: 106.05977630615234 	 kl mean: 7.458414554595947 	 loss mean: 113.5181884765625
nll mean: 106.77940368652344 	 kl mean: 7.458414554595947 	 loss mean: 114.23780822753906
nll mean: 157.1019287109375 	 kl mean: 8.414207458496094 	 loss mean: 165.51612854003906


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 14.53it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.60it/s][A

nll mean: 157.0528564453125 	 kl mean: 8.414207458496094 	 loss mean: 165.46707153320312
nll mean: 157.95474243164062 	 kl mean: 8.414207458496094 	 loss mean: 166.36895751953125
nll mean: 157.18479919433594 	 kl mean: 8.414207458496094 	 loss mean: 165.59901428222656


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 40%|████      | 4/10 [00:00<00:00, 14.60it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.65it/s][A

nll mean: 157.59866333007812 	 kl mean: 8.414207458496094 	 loss mean: 166.01287841796875
nll mean: 157.17039489746094 	 kl mean: 8.414207458496094 	 loss mean: 165.5845947265625
nll mean: 157.69078063964844 	 kl mean: 8.414207458496094 	 loss mean: 166.10498046875


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.65it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.64it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 157.204833984375 	 kl mean: 8.414207458496094 	 loss mean: 165.61904907226562
nll mean: 157.19549560546875 	 kl mean: 8.414207458496094 	 loss mean: 165.60968017578125
nll mean: 156.84815979003906 	 kl mean: 8.414207458496094 	 loss mean: 165.26235961914062
nll mean: 120.6791763305664 	 kl mean: 8.921710968017578 	 loss mean: 129.60089111328125


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.09it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.89it/s][A

nll mean: 121.46672058105469 	 kl mean: 8.921710968017578 	 loss mean: 130.388427734375
nll mean: 120.95304107666016 	 kl mean: 8.921710968017578 	 loss mean: 129.874755859375
nll mean: 120.87161254882812 	 kl mean: 8.921710968017578 	 loss mean: 129.7933349609375
nll mean: 120.85675811767578 	 kl mean: 8.921710968017578 	 loss mean: 129.77845764160156
nll mean: 120.91917419433594 	 kl mean: 8.921710968017578 	 loss mean: 129.84088134765625


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.89it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.55it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.8802490234375 	 kl mean: 8.921710968017578 	 loss mean: 129.8019561767578
nll mean: 120.99161529541016 	 kl mean: 8.921710968017578 	 loss mean: 129.913330078125
nll mean: 121.10404205322266 	 kl mean: 8.921710968017578 	 loss mean: 130.0257568359375
nll mean: 121.18379211425781 	 kl mean: 8.921710968017578 	 loss mean: 130.10549926757812


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.65it/s][A

nll mean: 113.70805358886719 	 kl mean: 7.517951011657715 	 loss mean: 121.22599792480469
nll mean: 114.3175048828125 	 kl mean: 7.517951011657715 	 loss mean: 121.83546447753906
nll mean: 114.23270416259766 	 kl mean: 7.517951011657715 	 loss mean: 121.75065612792969


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.65it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.72it/s][A

nll mean: 114.13574981689453 	 kl mean: 7.517951011657715 	 loss mean: 121.65371704101562
nll mean: 114.48585510253906 	 kl mean: 7.517951011657715 	 loss mean: 122.00379943847656
nll mean: 114.2410659790039 	 kl mean: 7.517951011657715 	 loss mean: 121.75901794433594


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.72it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.70it/s][A

nll mean: 114.54338073730469 	 kl mean: 7.517951011657715 	 loss mean: 122.06134033203125
nll mean: 114.07699584960938 	 kl mean: 7.517951011657715 	 loss mean: 121.5949478149414
nll mean: 114.45095825195312 	 kl mean: 7.517951011657715 	 loss mean: 121.96891784667969


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.73it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 23.43it/s][A

nll mean: 113.72602844238281 	 kl mean: 7.517951011657715 	 loss mean: 121.24398803710938
nll mean: 82.49125671386719 	 kl mean: 7.545131683349609 	 loss mean: 90.03638458251953
nll mean: 82.39402770996094 	 kl mean: 7.545131683349609 	 loss mean: 89.93915557861328
nll mean: 82.71110534667969 	 kl mean: 7.545131683349609 	 loss mean: 90.25623321533203
nll mean: 82.10401916503906 	 kl mean: 7.545131683349609 	 loss mean: 89.64915466308594


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 23.43it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.91it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.19it/s][A

nll mean: 82.44379425048828 	 kl mean: 7.545131683349609 	 loss mean: 89.98892974853516
nll mean: 82.36766052246094 	 kl mean: 7.545131683349609 	 loss mean: 89.91278076171875
nll mean: 82.36058807373047 	 kl mean: 7.545131683349609 	 loss mean: 89.90571594238281
nll mean: 82.19569396972656 	 kl mean: 7.545131683349609 	 loss mean: 89.7408218383789
nll mean: 82.14198303222656 	 kl mean: 7.545131683349609 	 loss mean: 89.68711853027344


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
100%|██████████| 10/10 [00:00<00:00, 22.10it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.40it/s][A

nll mean: 82.31282043457031 	 kl mean: 7.545131683349609 	 loss mean: 89.85795593261719
nll mean: 109.37674713134766 	 kl mean: 7.649331092834473 	 loss mean: 117.02607727050781
nll mean: 109.50881958007812 	 kl mean: 7.649331092834473 	 loss mean: 117.15815734863281
nll mean: 109.005859375 	 kl mean: 7.649331092834473 	 loss mean: 116.65518951416016
nll mean: 108.60781860351562 	 kl mean: 7.649331092834473 	 loss mean: 116.25714874267578


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.40it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.60it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.65it/s][A

nll mean: 108.79440307617188 	 kl mean: 7.649331092834473 	 loss mean: 116.44374084472656
nll mean: 108.90955352783203 	 kl mean: 7.649331092834473 	 loss mean: 116.55888366699219
nll mean: 109.61856079101562 	 kl mean: 7.649331092834473 	 loss mean: 117.26789855957031
nll mean: 109.44422912597656 	 kl mean: 7.649331092834473 	 loss mean: 117.09356689453125
nll mean: 108.88784790039062 	 kl mean: 7.649331092834473 	 loss mean: 116.53717041015625


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.77it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.31it/s][A

nll mean: 109.48037719726562 	 kl mean: 7.649331092834473 	 loss mean: 117.12971496582031
nll mean: 120.12489318847656 	 kl mean: 8.310070037841797 	 loss mean: 128.43496704101562
nll mean: 119.66026306152344 	 kl mean: 8.310070037841797 	 loss mean: 127.9703369140625


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 20%|██        | 2/10 [00:00<00:00, 12.31it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 40%|████      | 4/10 [00:00<00:00, 12.45it/s][A

nll mean: 120.21713256835938 	 kl mean: 8.310070037841797 	 loss mean: 128.52719116210938
nll mean: 119.82145690917969 	 kl mean: 8.310070037841797 	 loss mean: 128.13153076171875
nll mean: 120.01165771484375 	 kl mean: 8.310070037841797 	 loss mean: 128.3217315673828


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 40%|████      | 4/10 [00:00<00:00, 12.45it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A

nll mean: 119.86534118652344 	 kl mean: 8.310070037841797 	 loss mean: 128.1754150390625
nll mean: 119.63506317138672 	 kl mean: 8.310070037841797 	 loss mean: 127.94512939453125
nll mean: 120.01023864746094 	 kl mean: 8.310070037841797 	 loss mean: 128.3203125


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.85it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.52it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.46977996826172 	 kl mean: 8.310070037841797 	 loss mean: 128.77984619140625
nll mean: 119.9259033203125 	 kl mean: 8.310070037841797 	 loss mean: 128.2359619140625
nll mean: 61.85103988647461 	 kl mean: 8.184444427490234 	 loss mean: 70.03548431396484


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 20%|██        | 2/10 [00:00<00:00, 10.19it/s][A


nll mean: 61.55679702758789 	 kl mean: 8.184444427490234 	 loss mean: 69.74124145507812
nll mean: 62.18280029296875 	 kl mean: 8.184444427490234 	 loss mean: 70.36724853515625
nll mean: 61.778141021728516 	 kl mean: 8.184444427490234 	 loss mean: 69.96258544921875


                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 40%|████      | 4/10 [00:00<00:00, 10.16it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.22it/s][A

nll mean: 60.616058349609375 	 kl mean: 8.184444427490234 	 loss mean: 68.80049896240234
nll mean: 62.34703063964844 	 kl mean: 8.184444427490234 	 loss mean: 70.53147888183594
nll mean: 61.772701263427734 	 kl mean: 8.184444427490234 	 loss mean: 69.95713806152344


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.22it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.62it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.20it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.19it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]

nll mean: 61.61138916015625 	 kl mean: 8.184444427490234 	 loss mean: 69.79583740234375
nll mean: 62.3702507019043 	 kl mean: 8.184444427490234 	 loss mean: 70.55469512939453
nll mean: 61.36379623413086 	 kl mean: 8.184444427490234 	 loss mean: 69.54823303222656



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.40it/s][A

nll mean: 104.40780639648438 	 kl mean: 8.172574996948242 	 loss mean: 112.58038330078125
nll mean: 104.98953247070312 	 kl mean: 8.172574996948242 	 loss mean: 113.162109375
nll mean: 104.82772064208984 	 kl mean: 8.172574996948242 	 loss mean: 113.00028991699219


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.40it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 13.17it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.03it/s][A

nll mean: 104.13710021972656 	 kl mean: 8.172574996948242 	 loss mean: 112.30967712402344
nll mean: 104.20967102050781 	 kl mean: 8.172574996948242 	 loss mean: 112.38224792480469
nll mean: 104.47628784179688 	 kl mean: 8.172574996948242 	 loss mean: 112.64886474609375


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.03it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.02it/s][A

nll mean: 104.68150329589844 	 kl mean: 8.172574996948242 	 loss mean: 112.85408020019531
nll mean: 104.32119750976562 	 kl mean: 8.172574996948242 	 loss mean: 112.4937744140625
nll mean: 105.08419036865234 	 kl mean: 8.172574996948242 	 loss mean: 113.25677490234375


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.02it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.85it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
                                               

nll mean: 104.72222137451172 	 kl mean: 8.172574996948242 	 loss mean: 112.8947982788086
nll mean: 137.84347534179688 	 kl mean: 8.963164329528809 	 loss mean: 146.80665588378906



 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 20%|██        | 2/10 [00:00<00:00, 10.18it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.11it/s][A

nll mean: 138.003662109375 	 kl mean: 8.963164329528809 	 loss mean: 146.96682739257812
nll mean: 138.46937561035156 	 kl mean: 8.963164329528809 	 loss mean: 147.4325408935547


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 10.11it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 40%|████      | 4/10 [00:00<00:00, 10.02it/s][A


nll mean: 138.33706665039062 	 kl mean: 8.963164329528809 	 loss mean: 147.30023193359375
nll mean: 137.71798706054688 	 kl mean: 8.963164329528809 	 loss mean: 146.68115234375
nll mean: 138.25656127929688 	 kl mean: 8.963164329528809 	 loss mean: 147.2197265625


                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.04it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.92it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.93it/s][A

nll mean: 138.91358947753906 	 kl mean: 8.963164329528809 	 loss mean: 147.87673950195312
nll mean: 138.42347717285156 	 kl mean: 8.963164329528809 	 loss mean: 147.3866424560547


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.93it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.87it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.95it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.07748413085938 	 kl mean: 8.963164329528809 	 loss mean: 147.0406494140625
nll mean: 138.15261840820312 	 kl mean: 8.963164329528809 	 loss mean: 147.11578369140625
nll mean: 63.65019989013672 	 kl mean: 6.7184295654296875 	 loss mean: 70.3686294555664
nll mean: 63.56491470336914 	 kl mean: 6.7184295654296875 	 loss mean: 70.28334045410156


                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.16it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.94it/s][A

nll mean: 63.32454299926758 	 kl mean: 6.7184295654296875 	 loss mean: 70.04297637939453
nll mean: 63.62090301513672 	 kl mean: 6.7184295654296875 	 loss mean: 70.33934020996094
nll mean: 63.898162841796875 	 kl mean: 6.7184295654296875 	 loss mean: 70.61659240722656
nll mean: 63.58045196533203 	 kl mean: 6.7184295654296875 	 loss mean: 70.29888153076172
nll mean: 63.656219482421875 	 kl mean: 6.7184295654296875 	 loss mean: 70.37464904785156
nll mean: 63.314598083496094 	 kl mean: 6.7184295654296875 	 loss mean: 70.03302001953125


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.94it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s]
100%|██████████| 10/10 [00:00<00:00, 25.45it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 21.59it/s][A

nll mean: 63.93086242675781 	 kl mean: 6.7184295654296875 	 loss mean: 70.6492919921875
nll mean: 63.54484939575195 	 kl mean: 6.7184295654296875 	 loss mean: 70.26327514648438
nll mean: 118.65119934082031 	 kl mean: 7.656718730926514 	 loss mean: 126.30791473388672
nll mean: 118.41592407226562 	 kl mean: 7.656718730926514 	 loss mean: 126.07263946533203
nll mean: 118.49626159667969 	 kl mean: 7.656718730926514 	 loss mean: 126.1529769897461


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 21.59it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.57it/s][A

nll mean: 118.62809753417969 	 kl mean: 7.656718730926514 	 loss mean: 126.2848129272461
nll mean: 119.02145385742188 	 kl mean: 7.656718730926514 	 loss mean: 126.67817687988281
nll mean: 118.104736328125 	 kl mean: 7.656718730926514 	 loss mean: 125.76145935058594
nll mean: 118.03765869140625 	 kl mean: 7.656718730926514 	 loss mean: 125.69438171386719
nll mean: 118.61570739746094 	 kl mean: 7.656718730926514 	 loss mean: 126.27242279052734


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.57it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
100%|██████████| 10/10 [00:00<00:00, 21.56it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.70367431640625 	 kl mean: 7.656718730926514 	 loss mean: 126.36038970947266
nll mean: 118.82861328125 	 kl mean: 7.656718730926514 	 loss mean: 126.48533630371094
nll mean: 119.41230010986328 	 kl mean: 8.20846939086914 	 loss mean: 127.62077331542969


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 12.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A

nll mean: 119.14570617675781 	 kl mean: 8.20846939086914 	 loss mean: 127.35417938232422
nll mean: 119.03779602050781 	 kl mean: 8.20846939086914 	 loss mean: 127.24626922607422
nll mean: 119.53343200683594 	 kl mean: 8.20846939086914 	 loss mean: 127.74189758300781


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A

nll mean: 118.69629669189453 	 kl mean: 8.20846939086914 	 loss mean: 126.9047622680664
nll mean: 118.8458480834961 	 kl mean: 8.20846939086914 	 loss mean: 127.0543212890625
nll mean: 118.8661117553711 	 kl mean: 8.20846939086914 	 loss mean: 127.0745849609375


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.64it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.64501953125 	 kl mean: 8.20846939086914 	 loss mean: 126.8534927368164
nll mean: 118.71536254882812 	 kl mean: 8.20846939086914 	 loss mean: 126.92381286621094
nll mean: 118.89012145996094 	 kl mean: 8.20846939086914 	 loss mean: 127.09858703613281


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.70it/s][A

nll mean: 113.64218139648438 	 kl mean: 8.11929702758789 	 loss mean: 121.76148223876953
nll mean: 113.16050720214844 	 kl mean: 8.11929702758789 	 loss mean: 121.27980041503906
nll mean: 113.16375732421875 	 kl mean: 8.11929702758789 	 loss mean: 121.28305053710938


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.70it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.67it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.65it/s][A

nll mean: 113.00822448730469 	 kl mean: 8.11929702758789 	 loss mean: 121.12751770019531
nll mean: 113.50979614257812 	 kl mean: 8.11929702758789 	 loss mean: 121.62909698486328
nll mean: 113.91059875488281 	 kl mean: 8.11929702758789 	 loss mean: 122.02989196777344


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.65it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.58it/s][A

nll mean: 113.76359558105469 	 kl mean: 8.11929702758789 	 loss mean: 121.88288879394531
nll mean: 113.54863739013672 	 kl mean: 8.11929702758789 	 loss mean: 121.66793823242188
nll mean: 113.26713562011719 	 kl mean: 8.11929702758789 	 loss mean: 121.38644409179688


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.55it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 22.14it/s][A

nll mean: 113.43453979492188 	 kl mean: 8.11929702758789 	 loss mean: 121.55384063720703
nll mean: 111.09841918945312 	 kl mean: 8.100685119628906 	 loss mean: 119.19910430908203
nll mean: 110.89414978027344 	 kl mean: 8.100685119628906 	 loss mean: 118.99482727050781
nll mean: 111.17140197753906 	 kl mean: 8.100685119628906 	 loss mean: 119.27207946777344
nll mean: 111.35798645019531 	 kl mean: 8.100685119628906 	 loss mean: 119.45866394042969


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 22.14it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 50%|█████     | 5/10 [00:00<00:00, 21.27it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 80%|████████  | 8/10 [00:00<00:00, 21.18it/s][A

nll mean: 111.43700408935547 	 kl mean: 8.100685119628906 	 loss mean: 119.53768920898438
nll mean: 110.9571533203125 	 kl mean: 8.100685119628906 	 loss mean: 119.05783081054688
nll mean: 111.0567626953125 	 kl mean: 8.100685119628906 	 loss mean: 119.1574478149414
nll mean: 111.25352478027344 	 kl mean: 8.100685119628906 	 loss mean: 119.35420227050781
nll mean: 111.17901611328125 	 kl mean: 8.100685119628906 	 loss mean: 119.27969360351562


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
100%|██████████| 10/10 [00:00<00:00, 20.97it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 29.39it/s][A

nll mean: 111.21498107910156 	 kl mean: 8.100685119628906 	 loss mean: 119.31565856933594
nll mean: 85.50347900390625 	 kl mean: 8.018549919128418 	 loss mean: 93.52203369140625
nll mean: 85.20462799072266 	 kl mean: 8.018549919128418 	 loss mean: 93.22319030761719
nll mean: 85.16512298583984 	 kl mean: 8.018549919128418 	 loss mean: 93.18367767333984
nll mean: 85.64630126953125 	 kl mean: 8.018549919128418 	 loss mean: 93.66484069824219
nll mean: 85.09172821044922 	 kl mean: 8.018549919128418 	 loss mean: 93.11028289794922


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 29.39it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 29.32it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 29.15it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 85.9432601928711 	 kl mean: 8.018549919128418 	 loss mean: 93.9618148803711
nll mean: 85.20427703857422 	 kl mean: 8.018549919128418 	 loss mean: 93.22282409667969
nll mean: 84.71805572509766 	 kl mean: 8.018549919128418 	 loss mean: 92.73660278320312
nll mean: 85.56256103515625 	 kl mean: 8.018549919128418 	 loss mean: 93.58111572265625
nll mean: 85.71084594726562 	 kl mean: 8.018549919128418 	 loss mean: 93.72941589355469
Approximate NLL:
tensor(121.0295, device='cuda:0')
Approximate KL:
tensor(8.1792, device='cuda:0')
Testing took 0:00:25.211279


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .91it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .91it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A

nll mean: 109.23709869384766 	 kl mean: 8.866912841796875 	 loss mean: 118.10401153564453
nll mean: 109.06786346435547 	 kl mean: 8.866912841796875 	 loss mean: 117.93478393554688
nll mean: 109.27032470703125 	 kl mean: 8.866912841796875 	 loss mean: 118.1372299194336
nll mean: 109.46488189697266 	 kl mean: 8.866912841796875 	 loss mean: 118.33179473876953
nll mean: 109.01332092285156 	 kl mean: 8.866912841796875 	 loss mean: 117.88023376464844


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A
                                      .55it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .55it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .55it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 24.55it/s][A
                                      .21it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 23.94it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.57963562011719 	 kl mean: 8.866912841796875 	 loss mean: 117.44654846191406
nll mean: 109.47421264648438 	 kl mean: 8.866912841796875 	 loss mean: 118.34111785888672
nll mean: 108.9388427734375 	 kl mean: 8.866912841796875 	 loss mean: 117.80575561523438
nll mean: 108.93492126464844 	 kl mean: 8.866912841796875 	 loss mean: 117.80183410644531
nll mean: 108.71728515625 	 kl mean: 8.866912841796875 	 loss mean: 117.5842056274414


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
 20%|██        | 2/10 [00:00<00:00, 13.23it/s][A

nll mean: 124.73538208007812 	 kl mean: 8.632170677185059 	 loss mean: 133.3675537109375
nll mean: 125.35067749023438 	 kl mean: 8.632170677185059 	 loss mean: 133.98284912109375
nll mean: 125.71401977539062 	 kl mean: 8.632170677185059 	 loss mean: 134.34619140625


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
 20%|██        | 2/10 [00:00<00:00, 13.23it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
 40%|████      | 4/10 [00:00<00:00, 13.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.64it/s][A

nll mean: 125.21178436279297 	 kl mean: 8.632170677185059 	 loss mean: 133.84396362304688
nll mean: 125.07316589355469 	 kl mean: 8.632170677185059 	 loss mean: 133.705322265625
nll mean: 125.49542236328125 	 kl mean: 8.632170677185059 	 loss mean: 134.12759399414062


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.38it/s]
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.64it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.70it/s][A

nll mean: 126.02961730957031 	 kl mean: 8.632170677185059 	 loss mean: 134.6617889404297
nll mean: 126.16029357910156 	 kl mean: 8.632170677185059 	 loss mean: 134.79248046875
nll mean: 126.14558410644531 	 kl mean: 8.632170677185059 	 loss mean: 134.7777557373047


                                              
  3%|▎         | 1/38 [00:01<00:15,  2.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.81it/s][A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
 30%|███       | 3/10 [00:00<00:00, 24.37it/s][A

nll mean: 125.513916015625 	 kl mean: 8.632170677185059 	 loss mean: 134.14608764648438
nll mean: 99.75457763671875 	 kl mean: 7.898853778839111 	 loss mean: 107.65342712402344
nll mean: 99.77186584472656 	 kl mean: 7.898853778839111 	 loss mean: 107.67071533203125
nll mean: 99.41951751708984 	 kl mean: 7.898853778839111 	 loss mean: 107.31837463378906
nll mean: 99.37911987304688 	 kl mean: 7.898853778839111 	 loss mean: 107.27796936035156


                                              
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
 30%|███       | 3/10 [00:00<00:00, 24.37it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.28it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.20it/s][A

nll mean: 99.27718353271484 	 kl mean: 7.898853778839111 	 loss mean: 107.176025390625
nll mean: 99.29044342041016 	 kl mean: 7.898853778839111 	 loss mean: 107.18929290771484
nll mean: 99.59937286376953 	 kl mean: 7.898853778839111 	 loss mean: 107.49822235107422
nll mean: 99.16436767578125 	 kl mean: 7.898853778839111 	 loss mean: 107.06321716308594
nll mean: 99.65794372558594 	 kl mean: 7.898853778839111 	 loss mean: 107.55679321289062


                                              
  5%|▌         | 2/38 [00:01<00:18,  1.95it/s]
100%|██████████| 10/10 [00:00<00:00, 24.12it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.07it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.07it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.07it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.57it/s][A

nll mean: 99.12614440917969 	 kl mean: 7.898853778839111 	 loss mean: 107.02500915527344
nll mean: 139.00445556640625 	 kl mean: 8.188821792602539 	 loss mean: 147.19326782226562
nll mean: 138.19554138183594 	 kl mean: 8.188821792602539 	 loss mean: 146.3843536376953


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.07it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.07it/s]
 20%|██        | 2/10 [00:00<00:00, 10.57it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
 40%|████      | 4/10 [00:00<00:00, 10.60it/s][A

nll mean: 137.99227905273438 	 kl mean: 8.188821792602539 	 loss mean: 146.18109130859375
nll mean: 138.56381225585938 	 kl mean: 8.188821792602539 	 loss mean: 146.7526397705078
nll mean: 138.90585327148438 	 kl mean: 8.188821792602539 	 loss mean: 147.09466552734375


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
 40%|████      | 4/10 [00:00<00:00, 10.60it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.62it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A

nll mean: 138.46685791015625 	 kl mean: 8.188821792602539 	 loss mean: 146.6556854248047
nll mean: 138.73226928710938 	 kl mean: 8.188821792602539 	 loss mean: 146.92108154296875
nll mean: 138.73072814941406 	 kl mean: 8.188821792602539 	 loss mean: 146.9195556640625


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.07it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.58it/s][A
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
                                              
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.28712463378906 	 kl mean: 8.188821792602539 	 loss mean: 146.4759521484375
nll mean: 138.69479370117188 	 kl mean: 8.188821792602539 	 loss mean: 146.88360595703125
nll mean: 125.177001953125 	 kl mean: 8.058914184570312 	 loss mean: 133.2359161376953


                                              
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 14.54it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.38it/s][A

nll mean: 124.58651733398438 	 kl mean: 8.058914184570312 	 loss mean: 132.6454315185547
nll mean: 124.8108901977539 	 kl mean: 8.058914184570312 	 loss mean: 132.86981201171875
nll mean: 125.02945709228516 	 kl mean: 8.058914184570312 	 loss mean: 133.08837890625


                                              
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 14.38it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.11it/s][A

nll mean: 124.9755630493164 	 kl mean: 8.058914184570312 	 loss mean: 133.03448486328125
nll mean: 124.89335632324219 	 kl mean: 8.058914184570312 	 loss mean: 132.95225524902344
nll mean: 124.97586059570312 	 kl mean: 8.058914184570312 	 loss mean: 133.03477478027344


                                              
 11%|█         | 4/38 [00:03<00:21,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.11it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.61it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.06it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.95it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.98745727539062 	 kl mean: 8.058914184570312 	 loss mean: 133.04637145996094
nll mean: 124.55397033691406 	 kl mean: 8.058914184570312 	 loss mean: 132.61288452148438
nll mean: 125.37690734863281 	 kl mean: 8.058914184570312 	 loss mean: 133.43580627441406


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.54it/s][A

nll mean: 123.09266662597656 	 kl mean: 8.348633766174316 	 loss mean: 131.44131469726562
nll mean: 122.72232055664062 	 kl mean: 8.348633766174316 	 loss mean: 131.07095336914062
nll mean: 122.2005615234375 	 kl mean: 8.348633766174316 	 loss mean: 130.5491943359375


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.54it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.41it/s][A

nll mean: 122.00282287597656 	 kl mean: 8.348633766174316 	 loss mean: 130.35147094726562
nll mean: 122.73876953125 	 kl mean: 8.348633766174316 	 loss mean: 131.08740234375
nll mean: 122.80389404296875 	 kl mean: 8.348633766174316 	 loss mean: 131.1525421142578


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.41it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.14it/s][A

nll mean: 122.49191284179688 	 kl mean: 8.348633766174316 	 loss mean: 130.84054565429688
nll mean: 122.74249267578125 	 kl mean: 8.348633766174316 	 loss mean: 131.09112548828125
nll mean: 122.85547637939453 	 kl mean: 8.348633766174316 	 loss mean: 131.2041015625


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.14it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.17it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.49it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.49it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
 30%|███       | 3/10 [00:00<00:00, 25.32it/s][A

nll mean: 122.63615417480469 	 kl mean: 8.348633766174316 	 loss mean: 130.98477172851562
nll mean: 132.49375915527344 	 kl mean: 8.525306701660156 	 loss mean: 141.01907348632812
nll mean: 132.5996856689453 	 kl mean: 8.525306701660156 	 loss mean: 141.125
nll mean: 132.58157348632812 	 kl mean: 8.525306701660156 	 loss mean: 141.10687255859375
nll mean: 132.47254943847656 	 kl mean: 8.525306701660156 	 loss mean: 140.9978485107422


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
 30%|███       | 3/10 [00:00<00:00, 25.32it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.19it/s][A
                                              [A

nll mean: 132.53201293945312 	 kl mean: 8.525306701660156 	 loss mean: 141.05731201171875
nll mean: 132.36634826660156 	 kl mean: 8.525306701660156 	 loss mean: 140.89166259765625
nll mean: 132.78732299804688 	 kl mean: 8.525306701660156 	 loss mean: 141.3126220703125
nll mean: 133.07736206054688 	 kl mean: 8.525306701660156 	 loss mean: 141.6026611328125
nll mean: 133.15444946289062 	 kl mean: 8.525306701660156 	 loss mean: 141.67977905273438



 16%|█▌        | 6/38 [00:04<00:21,  1.49it/s]
100%|██████████| 10/10 [00:00<00:00, 24.93it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A

nll mean: 132.63600158691406 	 kl mean: 8.525306701660156 	 loss mean: 141.16131591796875
nll mean: 105.33482360839844 	 kl mean: 8.203171730041504 	 loss mean: 113.53799438476562
nll mean: 105.27699279785156 	 kl mean: 8.203171730041504 	 loss mean: 113.48016357421875
nll mean: 105.045654296875 	 kl mean: 8.203171730041504 	 loss mean: 113.24882507324219
nll mean: 105.34298706054688 	 kl mean: 8.203171730041504 	 loss mean: 113.54615783691406



 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00, 25.20it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.16it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.93it/s][A

nll mean: 105.14532470703125 	 kl mean: 8.203171730041504 	 loss mean: 113.34849548339844
nll mean: 104.80079650878906 	 kl mean: 8.203171730041504 	 loss mean: 113.00396728515625
nll mean: 105.036376953125 	 kl mean: 8.203171730041504 	 loss mean: 113.23955535888672
nll mean: 105.40205383300781 	 kl mean: 8.203171730041504 	 loss mean: 113.60521697998047
nll mean: 105.39583587646484 	 kl mean: 8.203171730041504 	 loss mean: 113.59901428222656


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
100%|██████████| 10/10 [00:00<00:00, 24.85it/s][A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A


nll mean: 105.2293701171875 	 kl mean: 8.203171730041504 	 loss mean: 113.43253326416016
nll mean: 130.80795288085938 	 kl mean: 8.628900527954102 	 loss mean: 139.43685913085938
nll mean: 131.60134887695312 	 kl mean: 8.628900527954102 	 loss mean: 140.23025512695312


 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 14.98it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A

nll mean: 130.7012176513672 	 kl mean: 8.628900527954102 	 loss mean: 139.33010864257812
nll mean: 131.13851928710938 	 kl mean: 8.628900527954102 	 loss mean: 139.76742553710938
nll mean: 130.78836059570312 	 kl mean: 8.628900527954102 	 loss mean: 139.41726684570312


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.57it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.96it/s][A

nll mean: 131.1511688232422 	 kl mean: 8.628900527954102 	 loss mean: 139.78005981445312
nll mean: 130.87863159179688 	 kl mean: 8.628900527954102 	 loss mean: 139.50753784179688
nll mean: 131.5643310546875 	 kl mean: 8.628900527954102 	 loss mean: 140.1932373046875
nll mean: 130.8468475341797 	 kl mean: 8.628900527954102 	 loss mean: 139.4757537841797


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.96it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.73it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.31it/s][A

nll mean: 130.62435913085938 	 kl mean: 8.628900527954102 	 loss mean: 139.25326538085938
nll mean: 131.14111328125 	 kl mean: 8.451858520507812 	 loss mean: 139.59295654296875
nll mean: 131.01695251464844 	 kl mean: 8.451858520507812 	 loss mean: 139.46881103515625
nll mean: 130.05267333984375 	 kl mean: 8.451858520507812 	 loss mean: 138.50454711914062
nll mean: 130.63888549804688 	 kl mean: 8.451858520507812 	 loss mean: 139.09072875976562


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.31it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.43it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.35it/s][A

nll mean: 130.39170837402344 	 kl mean: 8.451858520507812 	 loss mean: 138.84356689453125
nll mean: 130.81332397460938 	 kl mean: 8.451858520507812 	 loss mean: 139.26519775390625
nll mean: 130.33351135253906 	 kl mean: 8.451858520507812 	 loss mean: 138.78536987304688
nll mean: 130.92724609375 	 kl mean: 8.451858520507812 	 loss mean: 139.3791046142578
nll mean: 130.60406494140625 	 kl mean: 8.451858520507812 	 loss mean: 139.055908203125


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.44it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.74it/s][A

nll mean: 131.11355590820312 	 kl mean: 8.451858520507812 	 loss mean: 139.56539916992188
nll mean: 118.19001770019531 	 kl mean: 8.431913375854492 	 loss mean: 126.62193298339844
nll mean: 117.9605712890625 	 kl mean: 8.431913375854492 	 loss mean: 126.39248657226562
nll mean: 118.64998626708984 	 kl mean: 8.431913375854492 	 loss mean: 127.0819091796875
nll mean: 118.76775360107422 	 kl mean: 8.431913375854492 	 loss mean: 127.19966125488281


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.74it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.68it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.76it/s][A

nll mean: 118.51161193847656 	 kl mean: 8.431913375854492 	 loss mean: 126.94352722167969
nll mean: 117.8888168334961 	 kl mean: 8.431913375854492 	 loss mean: 126.32073211669922
nll mean: 119.07376098632812 	 kl mean: 8.431913375854492 	 loss mean: 127.50567626953125
nll mean: 118.57913208007812 	 kl mean: 8.431913375854492 	 loss mean: 127.01103210449219
nll mean: 118.58674621582031 	 kl mean: 8.431913375854492 	 loss mean: 127.0186538696289


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
100%|██████████| 10/10 [00:00<00:00, 24.72it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.69it/s][A

nll mean: 118.24482727050781 	 kl mean: 8.431913375854492 	 loss mean: 126.67675018310547
nll mean: 140.91314697265625 	 kl mean: 8.467796325683594 	 loss mean: 149.38095092773438
nll mean: 141.447509765625 	 kl mean: 8.467796325683594 	 loss mean: 149.91531372070312
nll mean: 140.6238555908203 	 kl mean: 8.467796325683594 	 loss mean: 149.09164428710938
nll mean: 140.7313232421875 	 kl mean: 8.467796325683594 	 loss mean: 149.19911193847656


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.69it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.41it/s][A

nll mean: 140.74447631835938 	 kl mean: 8.467796325683594 	 loss mean: 149.2122802734375
nll mean: 141.30599975585938 	 kl mean: 8.467796325683594 	 loss mean: 149.7738037109375
nll mean: 140.7344207763672 	 kl mean: 8.467796325683594 	 loss mean: 149.20220947265625
nll mean: 141.43777465820312 	 kl mean: 8.467796325683594 	 loss mean: 149.90557861328125
nll mean: 141.1678924560547 	 kl mean: 8.467796325683594 	 loss mean: 149.6356964111328


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
100%|██████████| 10/10 [00:00<00:00, 21.18it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.89it/s][A

nll mean: 140.51007080078125 	 kl mean: 8.467796325683594 	 loss mean: 148.97787475585938
nll mean: 119.12652587890625 	 kl mean: 8.59539794921875 	 loss mean: 127.721923828125
nll mean: 119.72329711914062 	 kl mean: 8.59539794921875 	 loss mean: 128.31869506835938


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.89it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.82it/s][A

nll mean: 119.5929946899414 	 kl mean: 8.59539794921875 	 loss mean: 128.1884002685547
nll mean: 119.33344268798828 	 kl mean: 8.59539794921875 	 loss mean: 127.92884826660156
nll mean: 119.01436614990234 	 kl mean: 8.59539794921875 	 loss mean: 127.6097640991211


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.82it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.67it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.60it/s][A

nll mean: 119.47742462158203 	 kl mean: 8.59539794921875 	 loss mean: 128.07281494140625
nll mean: 119.8214111328125 	 kl mean: 8.59539794921875 	 loss mean: 128.41680908203125
nll mean: 118.75505065917969 	 kl mean: 8.59539794921875 	 loss mean: 127.35045623779297


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00, 10.00it/s][A

nll mean: 119.30363464355469 	 kl mean: 8.59539794921875 	 loss mean: 127.8990249633789
nll mean: 119.50550842285156 	 kl mean: 8.59539794921875 	 loss mean: 128.10089111328125
nll mean: 158.4339141845703 	 kl mean: 9.562443733215332 	 loss mean: 167.99636840820312


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 10%|█         | 1/10 [00:00<00:00, 10.00it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00,  9.95it/s][A
                                               [A


nll mean: 159.0546417236328 	 kl mean: 9.562443733215332 	 loss mean: 168.61709594726562
nll mean: 159.600830078125 	 kl mean: 9.562443733215332 	 loss mean: 169.16326904296875


 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00,  9.92it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 40%|████      | 4/10 [00:00<00:00,  9.94it/s][A

nll mean: 159.001708984375 	 kl mean: 9.562443733215332 	 loss mean: 168.5641632080078
nll mean: 158.72320556640625 	 kl mean: 9.562443733215332 	 loss mean: 168.28564453125
nll mean: 158.49057006835938 	 kl mean: 9.562443733215332 	 loss mean: 168.05300903320312



                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.99it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.94it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.92it/s][A

nll mean: 159.15191650390625 	 kl mean: 9.562443733215332 	 loss mean: 168.71435546875
nll mean: 158.81124877929688 	 kl mean: 9.562443733215332 	 loss mean: 168.3737030029297


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.92it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.91it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 158.95440673828125 	 kl mean: 9.562443733215332 	 loss mean: 168.51686096191406
nll mean: 158.8761749267578 	 kl mean: 9.562443733215332 	 loss mean: 168.43861389160156
nll mean: 134.68661499023438 	 kl mean: 8.247685432434082 	 loss mean: 142.93429565429688


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.16it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.97it/s][A

nll mean: 134.2762451171875 	 kl mean: 8.247685432434082 	 loss mean: 142.52392578125
nll mean: 134.8006591796875 	 kl mean: 8.247685432434082 	 loss mean: 143.04835510253906
nll mean: 134.66119384765625 	 kl mean: 8.247685432434082 	 loss mean: 142.90887451171875
nll mean: 135.18624877929688 	 kl mean: 8.247685432434082 	 loss mean: 143.4339599609375


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.97it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.93it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.93it/s][A

nll mean: 135.0169677734375 	 kl mean: 8.247685432434082 	 loss mean: 143.26466369628906
nll mean: 134.3538818359375 	 kl mean: 8.247685432434082 	 loss mean: 142.60157775878906
nll mean: 135.3530731201172 	 kl mean: 8.247685432434082 	 loss mean: 143.6007537841797
nll mean: 135.10809326171875 	 kl mean: 8.247685432434082 	 loss mean: 143.35580444335938


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.93it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.81it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.52it/s][A

nll mean: 135.405517578125 	 kl mean: 8.247685432434082 	 loss mean: 143.6531982421875
nll mean: 143.0419921875 	 kl mean: 8.42194652557373 	 loss mean: 151.46392822265625
nll mean: 142.94976806640625 	 kl mean: 8.42194652557373 	 loss mean: 151.37173461914062


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.52it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.55it/s][A

nll mean: 143.2703094482422 	 kl mean: 8.42194652557373 	 loss mean: 151.6922607421875
nll mean: 143.19131469726562 	 kl mean: 8.42194652557373 	 loss mean: 151.61325073242188
nll mean: 142.38632202148438 	 kl mean: 8.42194652557373 	 loss mean: 150.80825805664062


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.55it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.54it/s][A

nll mean: 143.41693115234375 	 kl mean: 8.42194652557373 	 loss mean: 151.8388671875
nll mean: 143.0120849609375 	 kl mean: 8.42194652557373 	 loss mean: 151.43402099609375
nll mean: 142.52035522460938 	 kl mean: 8.42194652557373 	 loss mean: 150.94232177734375


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.54it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.49it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.04306030273438 	 kl mean: 8.42194652557373 	 loss mean: 151.4650115966797
nll mean: 143.42384338378906 	 kl mean: 8.42194652557373 	 loss mean: 151.84579467773438
nll mean: 143.2390594482422 	 kl mean: 8.146373748779297 	 loss mean: 151.3854217529297
nll mean: 143.57232666015625 	 kl mean: 8.146373748779297 	 loss mean: 151.7187042236328


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 23.86it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.67it/s][A

nll mean: 143.51312255859375 	 kl mean: 8.146373748779297 	 loss mean: 151.6595001220703
nll mean: 143.41189575195312 	 kl mean: 8.146373748779297 	 loss mean: 151.55825805664062
nll mean: 143.345947265625 	 kl mean: 8.146373748779297 	 loss mean: 151.49234008789062
nll mean: 143.87667846679688 	 kl mean: 8.146373748779297 	 loss mean: 152.02304077148438
nll mean: 142.84280395507812 	 kl mean: 8.146373748779297 	 loss mean: 150.9891815185547


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.67it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
100%|██████████| 10/10 [00:00<00:00, 23.56it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.4342041015625 	 kl mean: 8.146373748779297 	 loss mean: 151.58056640625
nll mean: 143.28602600097656 	 kl mean: 8.146373748779297 	 loss mean: 151.43240356445312
nll mean: 143.1022186279297 	 kl mean: 8.146373748779297 	 loss mean: 151.24859619140625
nll mean: 132.5159912109375 	 kl mean: 8.505706787109375 	 loss mean: 141.02169799804688
nll mean: 131.9358673095703 	 kl mean: 8.505706787109375 	 loss mean: 140.4415740966797


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.06it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.00it/s][A

nll mean: 132.01068115234375 	 kl mean: 8.505706787109375 	 loss mean: 140.5164031982422
nll mean: 132.63819885253906 	 kl mean: 8.505706787109375 	 loss mean: 141.14390563964844
nll mean: 131.84217834472656 	 kl mean: 8.505706787109375 	 loss mean: 140.347900390625
nll mean: 132.3188934326172 	 kl mean: 8.505706787109375 	 loss mean: 140.8245849609375
nll mean: 132.356201171875 	 kl mean: 8.505706787109375 	 loss mean: 140.8618927001953


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.00it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 24.83it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.72it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.05899047851562 	 kl mean: 8.505706787109375 	 loss mean: 140.56468200683594
nll mean: 132.0526885986328 	 kl mean: 8.505706787109375 	 loss mean: 140.55838012695312
nll mean: 132.1646728515625 	 kl mean: 8.505706787109375 	 loss mean: 140.67037963867188
nll mean: 129.0432891845703 	 kl mean: 9.39427661895752 	 loss mean: 138.43756103515625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 20%|██        | 2/10 [00:00<00:00, 12.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.65it/s][A

nll mean: 128.40155029296875 	 kl mean: 9.39427661895752 	 loss mean: 137.7958221435547
nll mean: 128.97021484375 	 kl mean: 9.39427661895752 	 loss mean: 138.36448669433594
nll mean: 128.96090698242188 	 kl mean: 9.39427661895752 	 loss mean: 138.35519409179688


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 40%|████      | 4/10 [00:00<00:00, 12.65it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A

nll mean: 128.59579467773438 	 kl mean: 9.39427661895752 	 loss mean: 137.99008178710938
nll mean: 128.4610137939453 	 kl mean: 9.39427661895752 	 loss mean: 137.85528564453125
nll mean: 128.69183349609375 	 kl mean: 9.39427661895752 	 loss mean: 138.08612060546875


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.61it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.68it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.86477661132812 	 kl mean: 9.39427661895752 	 loss mean: 138.259033203125
nll mean: 129.0108642578125 	 kl mean: 9.39427661895752 	 loss mean: 138.40512084960938
nll mean: 128.68479919433594 	 kl mean: 9.39427661895752 	 loss mean: 138.07908630371094


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.71it/s][A

nll mean: 147.57894897460938 	 kl mean: 8.66619873046875 	 loss mean: 156.24514770507812
nll mean: 146.98057556152344 	 kl mean: 8.66619873046875 	 loss mean: 155.64675903320312
nll mean: 147.18093872070312 	 kl mean: 8.66619873046875 	 loss mean: 155.84713745117188


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.71it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 12.70it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.68it/s][A

nll mean: 147.41796875 	 kl mean: 8.66619873046875 	 loss mean: 156.08416748046875
nll mean: 147.18910217285156 	 kl mean: 8.66619873046875 	 loss mean: 155.8553009033203
nll mean: 147.19989013671875 	 kl mean: 8.66619873046875 	 loss mean: 155.8660888671875


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.68it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A

nll mean: 146.995849609375 	 kl mean: 8.66619873046875 	 loss mean: 155.6620635986328
nll mean: 147.18829345703125 	 kl mean: 8.66619873046875 	 loss mean: 155.8544921875
nll mean: 147.01205444335938 	 kl mean: 8.66619873046875 	 loss mean: 155.6782684326172


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.67it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.10it/s][A

nll mean: 147.0245361328125 	 kl mean: 8.66619873046875 	 loss mean: 155.69073486328125
nll mean: 154.8365020751953 	 kl mean: 8.359926223754883 	 loss mean: 163.19642639160156
nll mean: 155.0438995361328 	 kl mean: 8.359926223754883 	 loss mean: 163.40382385253906


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 13.10it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.93it/s][A

nll mean: 154.909912109375 	 kl mean: 8.359926223754883 	 loss mean: 163.26983642578125
nll mean: 154.74224853515625 	 kl mean: 8.359926223754883 	 loss mean: 163.1021728515625
nll mean: 154.82533264160156 	 kl mean: 8.359926223754883 	 loss mean: 163.18527221679688


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.93it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.86it/s][A

nll mean: 155.28550720214844 	 kl mean: 8.359926223754883 	 loss mean: 163.64541625976562
nll mean: 154.83546447753906 	 kl mean: 8.359926223754883 	 loss mean: 163.1953887939453
nll mean: 155.01934814453125 	 kl mean: 8.359926223754883 	 loss mean: 163.3792724609375


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.86it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.80it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 154.81533813476562 	 kl mean: 8.359926223754883 	 loss mean: 163.17527770996094
nll mean: 154.71047973632812 	 kl mean: 8.359926223754883 	 loss mean: 163.07040405273438
nll mean: 116.5709457397461 	 kl mean: 8.396718978881836 	 loss mean: 124.96766662597656


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.29it/s][A
                                               [A

nll mean: 116.97677612304688 	 kl mean: 8.396718978881836 	 loss mean: 125.37348175048828
nll mean: 116.10038757324219 	 kl mean: 8.396718978881836 	 loss mean: 124.49710083007812



 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 30%|███       | 3/10 [00:00<00:00, 10.18it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 10.11it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.07it/s][A

nll mean: 116.77472686767578 	 kl mean: 8.396718978881836 	 loss mean: 125.17144775390625
nll mean: 116.62164306640625 	 kl mean: 8.396718978881836 	 loss mean: 125.01836395263672


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.07it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.00it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.98it/s][A

nll mean: 116.61519622802734 	 kl mean: 8.396718978881836 	 loss mean: 125.01190185546875
nll mean: 115.95112609863281 	 kl mean: 8.396718978881836 	 loss mean: 124.34783935546875


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.98it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.94it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.88it/s][A

nll mean: 117.02061462402344 	 kl mean: 8.396718978881836 	 loss mean: 125.4173355102539
nll mean: 116.67304229736328 	 kl mean: 8.396718978881836 	 loss mean: 125.06975555419922


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
100%|██████████| 10/10 [00:01<00:00,  9.99it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 31.83it/s][A

nll mean: 115.74092864990234 	 kl mean: 8.396718978881836 	 loss mean: 124.13763427734375
nll mean: 106.16217041015625 	 kl mean: 7.556591987609863 	 loss mean: 113.71876525878906
nll mean: 105.7350082397461 	 kl mean: 7.556591987609863 	 loss mean: 113.29159545898438
nll mean: 105.86494445800781 	 kl mean: 7.556591987609863 	 loss mean: 113.42153930664062
nll mean: 105.82833099365234 	 kl mean: 7.556591987609863 	 loss mean: 113.38491821289062
nll mean: 105.87680053710938 	 kl mean: 7.556591987609863 	 loss mean: 113.43339538574219
nll mean: 105.41310119628906 	 kl mean: 7.556591987609863 	 loss mean: 112.96969604492188


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 31.83it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 31.26it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.51260375976562 	 kl mean: 7.556591987609863 	 loss mean: 113.0691909790039
nll mean: 106.51606750488281 	 kl mean: 7.556591987609863 	 loss mean: 114.07266235351562
nll mean: 106.23582458496094 	 kl mean: 7.556591987609863 	 loss mean: 113.79241180419922
nll mean: 105.46359252929688 	 kl mean: 7.556591987609863 	 loss mean: 113.02018737792969
nll mean: 155.78515625 	 kl mean: 8.635913848876953 	 loss mean: 164.42108154296875


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.30it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.32it/s][A

nll mean: 156.03451538085938 	 kl mean: 8.635913848876953 	 loss mean: 164.67042541503906
nll mean: 156.24331665039062 	 kl mean: 8.635913848876953 	 loss mean: 164.87924194335938
nll mean: 156.26657104492188 	 kl mean: 8.635913848876953 	 loss mean: 164.90248107910156


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 14.32it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.34it/s][A

nll mean: 156.4676513671875 	 kl mean: 8.635913848876953 	 loss mean: 165.10357666015625
nll mean: 156.30862426757812 	 kl mean: 8.635913848876953 	 loss mean: 164.94454956054688
nll mean: 156.19384765625 	 kl mean: 8.635913848876953 	 loss mean: 164.8297576904297


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.34it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.31it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.32it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 156.32923889160156 	 kl mean: 8.635913848876953 	 loss mean: 164.9651641845703
nll mean: 155.99375915527344 	 kl mean: 8.635913848876953 	 loss mean: 164.62966918945312
nll mean: 156.4200897216797 	 kl mean: 8.635913848876953 	 loss mean: 165.05599975585938
nll mean: 119.69497680664062 	 kl mean: 9.443400382995605 	 loss mean: 129.1383819580078


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
 30%|███       | 3/10 [00:00<00:00, 21.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.41it/s][A

nll mean: 119.48826599121094 	 kl mean: 9.443400382995605 	 loss mean: 128.93165588378906
nll mean: 119.25700378417969 	 kl mean: 9.443400382995605 	 loss mean: 128.70040893554688
nll mean: 119.0458755493164 	 kl mean: 9.443400382995605 	 loss mean: 128.48927307128906
nll mean: 119.18490600585938 	 kl mean: 9.443400382995605 	 loss mean: 128.62831115722656
nll mean: 119.5726547241211 	 kl mean: 9.443400382995605 	 loss mean: 129.01605224609375


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.41it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.49it/s]
100%|██████████| 10/10 [00:00<00:00, 21.17it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.14910888671875 	 kl mean: 9.443400382995605 	 loss mean: 129.59249877929688
nll mean: 120.12724304199219 	 kl mean: 9.443400382995605 	 loss mean: 129.57064819335938
nll mean: 119.70892333984375 	 kl mean: 9.443400382995605 	 loss mean: 129.15231323242188
nll mean: 119.68991088867188 	 kl mean: 9.443400382995605 	 loss mean: 129.13330078125


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.83it/s][A

nll mean: 113.78074645996094 	 kl mean: 7.590457916259766 	 loss mean: 121.37120056152344
nll mean: 113.55366516113281 	 kl mean: 7.590457916259766 	 loss mean: 121.14413452148438
nll mean: 113.62299346923828 	 kl mean: 7.590457916259766 	 loss mean: 121.21345520019531


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.83it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.80it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A

nll mean: 113.74784088134766 	 kl mean: 7.590457916259766 	 loss mean: 121.33830261230469
nll mean: 113.36503601074219 	 kl mean: 7.590457916259766 	 loss mean: 120.95549011230469
nll mean: 113.7458267211914 	 kl mean: 7.590457916259766 	 loss mean: 121.3362808227539


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.70it/s][A

nll mean: 114.07878875732422 	 kl mean: 7.590457916259766 	 loss mean: 121.66925048828125
nll mean: 114.04434204101562 	 kl mean: 7.590457916259766 	 loss mean: 121.63479614257812
nll mean: 114.02069854736328 	 kl mean: 7.590457916259766 	 loss mean: 121.61115264892578


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.70it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.68it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
 30%|███       | 3/10 [00:00<00:00, 22.40it/s][A

nll mean: 113.40135192871094 	 kl mean: 7.590457916259766 	 loss mean: 120.99180603027344
nll mean: 81.96832275390625 	 kl mean: 7.460407733917236 	 loss mean: 89.42872619628906
nll mean: 81.55716705322266 	 kl mean: 7.460407733917236 	 loss mean: 89.017578125
nll mean: 81.7629623413086 	 kl mean: 7.460407733917236 	 loss mean: 89.2233657836914
nll mean: 81.82637023925781 	 kl mean: 7.460407733917236 	 loss mean: 89.28678894042969


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
 30%|███       | 3/10 [00:00<00:00, 22.40it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.44it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.11it/s][A

nll mean: 81.65219116210938 	 kl mean: 7.460407733917236 	 loss mean: 89.11259460449219
nll mean: 81.77198791503906 	 kl mean: 7.460407733917236 	 loss mean: 89.2323989868164
nll mean: 81.87828063964844 	 kl mean: 7.460407733917236 	 loss mean: 89.33868408203125
nll mean: 81.99519348144531 	 kl mean: 7.460407733917236 	 loss mean: 89.45560455322266
nll mean: 82.00497436523438 	 kl mean: 7.460407733917236 	 loss mean: 89.46538543701172


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.58it/s]
100%|██████████| 10/10 [00:00<00:00, 22.17it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.72it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A

nll mean: 81.17582702636719 	 kl mean: 7.460407733917236 	 loss mean: 88.63623809814453
nll mean: 107.42897033691406 	 kl mean: 7.924598693847656 	 loss mean: 115.35356903076172
nll mean: 107.89891052246094 	 kl mean: 7.924598693847656 	 loss mean: 115.82351684570312
nll mean: 107.85157775878906 	 kl mean: 7.924598693847656 	 loss mean: 115.77617645263672
nll mean: 107.64167785644531 	 kl mean: 7.924598693847656 	 loss mean: 115.56626892089844


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.74it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.77it/s][A

nll mean: 107.87510681152344 	 kl mean: 7.924598693847656 	 loss mean: 115.79969787597656
nll mean: 107.77645874023438 	 kl mean: 7.924598693847656 	 loss mean: 115.7010498046875
nll mean: 108.12478637695312 	 kl mean: 7.924598693847656 	 loss mean: 116.04939270019531
nll mean: 107.90568542480469 	 kl mean: 7.924598693847656 	 loss mean: 115.83029174804688
nll mean: 108.05020904541016 	 kl mean: 7.924598693847656 	 loss mean: 115.97480010986328


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 21.78it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.30it/s][A

nll mean: 108.11613464355469 	 kl mean: 7.924598693847656 	 loss mean: 116.04073333740234
nll mean: 119.17056274414062 	 kl mean: 8.479338645935059 	 loss mean: 127.64990234375
nll mean: 119.29241943359375 	 kl mean: 8.479338645935059 	 loss mean: 127.77175903320312


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.30it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.22it/s][A

nll mean: 119.24073028564453 	 kl mean: 8.479338645935059 	 loss mean: 127.7200698852539
nll mean: 120.0662841796875 	 kl mean: 8.479338645935059 	 loss mean: 128.5456085205078
nll mean: 119.87606811523438 	 kl mean: 8.479338645935059 	 loss mean: 128.35540771484375


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.22it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.26it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.32it/s][A

nll mean: 119.36956787109375 	 kl mean: 8.479338645935059 	 loss mean: 127.8488998413086
nll mean: 119.2958984375 	 kl mean: 8.479338645935059 	 loss mean: 127.77523040771484
nll mean: 120.09664154052734 	 kl mean: 8.479338645935059 	 loss mean: 128.57598876953125


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.32it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.32it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.49235534667969 	 kl mean: 8.479338645935059 	 loss mean: 127.97169494628906
nll mean: 119.48735046386719 	 kl mean: 8.479338645935059 	 loss mean: 127.9666976928711
nll mean: 61.50684356689453 	 kl mean: 8.613973617553711 	 loss mean: 70.12081909179688


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 10.09it/s][A
                                               [A

nll mean: 61.79957580566406 	 kl mean: 8.613973617553711 	 loss mean: 70.41354370117188
nll mean: 62.257537841796875 	 kl mean: 8.613973617553711 	 loss mean: 70.87151336669922



 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 10.05it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 40%|████      | 4/10 [00:00<00:00, 10.02it/s][A
                                               [A


nll mean: 62.080230712890625 	 kl mean: 8.613973617553711 	 loss mean: 70.69420623779297
nll mean: 61.474205017089844 	 kl mean: 8.613973617553711 	 loss mean: 70.08818054199219


 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.00it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.98it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.08it/s][A

nll mean: 62.084617614746094 	 kl mean: 8.613973617553711 	 loss mean: 70.6985855102539
nll mean: 61.35862731933594 	 kl mean: 8.613973617553711 	 loss mean: 69.97260284423828
nll mean: 61.39535140991211 	 kl mean: 8.613973617553711 	 loss mean: 70.00933074951172


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.08it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.10it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 61.78473663330078 	 kl mean: 8.613973617553711 	 loss mean: 70.39871215820312
nll mean: 61.27570724487305 	 kl mean: 8.613973617553711 	 loss mean: 69.88967895507812
nll mean: 104.72491455078125 	 kl mean: 8.073014259338379 	 loss mean: 112.79792022705078


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A

nll mean: 104.6593246459961 	 kl mean: 8.073014259338379 	 loss mean: 112.73234558105469
nll mean: 104.93941497802734 	 kl mean: 8.073014259338379 	 loss mean: 113.01242065429688
nll mean: 104.79948425292969 	 kl mean: 8.073014259338379 	 loss mean: 112.87249755859375


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.79it/s][A

nll mean: 105.02610778808594 	 kl mean: 8.073014259338379 	 loss mean: 113.09912109375
nll mean: 104.48672485351562 	 kl mean: 8.073014259338379 	 loss mean: 112.55973815917969
nll mean: 104.52359008789062 	 kl mean: 8.073014259338379 	 loss mean: 112.59660339355469


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.79it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:20<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.82it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.74it/s][A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.44353485107422 	 kl mean: 8.073014259338379 	 loss mean: 112.51654815673828
nll mean: 104.8316650390625 	 kl mean: 8.073014259338379 	 loss mean: 112.90467834472656
nll mean: 104.9999008178711 	 kl mean: 8.073014259338379 	 loss mean: 113.07291412353516


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 10%|█         | 1/10 [00:00<00:00,  9.95it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]

nll mean: 137.48825073242188 	 kl mean: 8.777030944824219 	 loss mean: 146.26527404785156
nll mean: 137.9171142578125 	 kl mean: 8.777030944824219 	 loss mean: 146.69415283203125
nll mean: 137.8284912109375 	 kl mean: 8.777030944824219 	 loss mean: 146.6055145263672



                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00,  9.96it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 40%|████      | 4/10 [00:00<00:00,  9.99it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.93it/s][A

nll mean: 137.780029296875 	 kl mean: 8.777030944824219 	 loss mean: 146.55706787109375
nll mean: 137.53785705566406 	 kl mean: 8.777030944824219 	 loss mean: 146.3148956298828


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.93it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.90it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A

nll mean: 138.0566864013672 	 kl mean: 8.777030944824219 	 loss mean: 146.83370971679688
nll mean: 137.98452758789062 	 kl mean: 8.777030944824219 	 loss mean: 146.7615509033203


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.87it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.86it/s][A

nll mean: 138.3150177001953 	 kl mean: 8.777030944824219 	 loss mean: 147.092041015625
nll mean: 137.77008056640625 	 kl mean: 8.777030944824219 	 loss mean: 146.547119140625


                                               
 82%|████████▏ | 31/38 [00:21<00:05,  1.33it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.86it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.89it/s][A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.24it/s][A

nll mean: 137.95309448242188 	 kl mean: 8.777030944824219 	 loss mean: 146.73013305664062
nll mean: 64.62813568115234 	 kl mean: 6.814316749572754 	 loss mean: 71.44245147705078
nll mean: 65.02468872070312 	 kl mean: 6.814316749572754 	 loss mean: 71.83900451660156
nll mean: 64.59688568115234 	 kl mean: 6.814316749572754 	 loss mean: 71.41120910644531
nll mean: 64.60128784179688 	 kl mean: 6.814316749572754 	 loss mean: 71.41560363769531
nll mean: 64.85537719726562 	 kl mean: 6.814316749572754 	 loss mean: 71.66969299316406


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.24it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.03it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
100%|██████████| 10/10 [00:00<00:00, 25.63it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 64.91078186035156 	 kl mean: 6.814316749572754 	 loss mean: 71.72509002685547
nll mean: 64.98480224609375 	 kl mean: 6.814316749572754 	 loss mean: 71.79912567138672
nll mean: 64.96099090576172 	 kl mean: 6.814316749572754 	 loss mean: 71.77530670166016
nll mean: 64.53903198242188 	 kl mean: 6.814316749572754 	 loss mean: 71.35334777832031
nll mean: 64.84513092041016 	 kl mean: 6.814316749572754 	 loss mean: 71.6594467163086


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.75it/s][A

nll mean: 119.50575256347656 	 kl mean: 7.8289337158203125 	 loss mean: 127.33468627929688
nll mean: 118.99390411376953 	 kl mean: 7.8289337158203125 	 loss mean: 126.82283782958984
nll mean: 119.14701843261719 	 kl mean: 7.8289337158203125 	 loss mean: 126.9759521484375
nll mean: 119.48765563964844 	 kl mean: 7.8289337158203125 	 loss mean: 127.31659698486328
nll mean: 119.4013671875 	 kl mean: 7.8289337158203125 	 loss mean: 127.23030090332031


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.75it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.93it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.77it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.21837615966797 	 kl mean: 7.8289337158203125 	 loss mean: 127.04730987548828
nll mean: 119.22759246826172 	 kl mean: 7.8289337158203125 	 loss mean: 127.0565185546875
nll mean: 119.25086975097656 	 kl mean: 7.8289337158203125 	 loss mean: 127.0798110961914
nll mean: 119.00753784179688 	 kl mean: 7.8289337158203125 	 loss mean: 126.83648681640625
nll mean: 119.33187866210938 	 kl mean: 7.8289337158203125 	 loss mean: 127.16081237792969


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.39it/s][A

nll mean: 120.38177490234375 	 kl mean: 8.234020233154297 	 loss mean: 128.61578369140625
nll mean: 120.7445068359375 	 kl mean: 8.234020233154297 	 loss mean: 128.978515625
nll mean: 120.47931671142578 	 kl mean: 8.234020233154297 	 loss mean: 128.71334838867188


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.39it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.57it/s][A

nll mean: 119.98800659179688 	 kl mean: 8.234020233154297 	 loss mean: 128.22203063964844
nll mean: 120.20521545410156 	 kl mean: 8.234020233154297 	 loss mean: 128.43923950195312
nll mean: 120.6234130859375 	 kl mean: 8.234020233154297 	 loss mean: 128.85743713378906


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.57it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.76it/s][A

nll mean: 120.35794067382812 	 kl mean: 8.234020233154297 	 loss mean: 128.59194946289062
nll mean: 120.24774169921875 	 kl mean: 8.234020233154297 	 loss mean: 128.4817657470703
nll mean: 120.03111267089844 	 kl mean: 8.234020233154297 	 loss mean: 128.26513671875


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.74it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A

nll mean: 119.94029235839844 	 kl mean: 8.234020233154297 	 loss mean: 128.17431640625
nll mean: 113.1659927368164 	 kl mean: 8.005974769592285 	 loss mean: 121.1719741821289
nll mean: 112.85287475585938 	 kl mean: 8.005974769592285 	 loss mean: 120.85884857177734


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A

nll mean: 113.201904296875 	 kl mean: 8.005974769592285 	 loss mean: 121.20787811279297
nll mean: 113.3565444946289 	 kl mean: 8.005974769592285 	 loss mean: 121.3625259399414
nll mean: 113.90437316894531 	 kl mean: 8.005974769592285 	 loss mean: 121.91034698486328


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.73it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A

nll mean: 113.62384796142578 	 kl mean: 8.005974769592285 	 loss mean: 121.62982177734375
nll mean: 113.822021484375 	 kl mean: 8.005974769592285 	 loss mean: 121.8280029296875
nll mean: 113.35135650634766 	 kl mean: 8.005974769592285 	 loss mean: 121.35733032226562


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.65it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 113.13986206054688 	 kl mean: 8.005974769592285 	 loss mean: 121.14583587646484
nll mean: 113.05775451660156 	 kl mean: 8.005974769592285 	 loss mean: 121.063720703125
nll mean: 110.9993896484375 	 kl mean: 8.296426773071289 	 loss mean: 119.29582214355469
nll mean: 111.18634033203125 	 kl mean: 8.296426773071289 	 loss mean: 119.48277282714844


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 21.63it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.60it/s][A

nll mean: 111.288330078125 	 kl mean: 8.296426773071289 	 loss mean: 119.58474731445312
nll mean: 111.6714859008789 	 kl mean: 8.296426773071289 	 loss mean: 119.96791076660156
nll mean: 110.87687683105469 	 kl mean: 8.296426773071289 	 loss mean: 119.17330932617188
nll mean: 111.21072387695312 	 kl mean: 8.296426773071289 	 loss mean: 119.50715637207031
nll mean: 111.59611511230469 	 kl mean: 8.296426773071289 	 loss mean: 119.89253997802734


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.60it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.32it/s]
100%|██████████| 10/10 [00:00<00:00, 21.54it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.0285873413086 	 kl mean: 8.296426773071289 	 loss mean: 119.32501983642578
nll mean: 111.35128784179688 	 kl mean: 8.296426773071289 	 loss mean: 119.64771270751953
nll mean: 111.31672668457031 	 kl mean: 8.296426773071289 	 loss mean: 119.61315155029297
nll mean: 85.05127716064453 	 kl mean: 7.965381622314453 	 loss mean: 93.01666259765625
nll mean: 86.12249755859375 	 kl mean: 7.965381622314453 	 loss mean: 94.08787536621094
nll mean: 85.1331787109375 	 kl mean: 7.965381622314453 	 loss mean: 93.09856414794922


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 31.00it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 30.71it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 85.31280517578125 	 kl mean: 7.965381622314453 	 loss mean: 93.27818298339844
nll mean: 84.9037857055664 	 kl mean: 7.965381622314453 	 loss mean: 92.8691635131836
nll mean: 85.41439056396484 	 kl mean: 7.965381622314453 	 loss mean: 93.3797607421875
nll mean: 85.51506042480469 	 kl mean: 7.965381622314453 	 loss mean: 93.48043823242188
nll mean: 85.08480072021484 	 kl mean: 7.965381622314453 	 loss mean: 93.0501708984375
nll mean: 84.74919128417969 	 kl mean: 7.965381622314453 	 loss mean: 92.71456146240234
nll mean: 84.94896697998047 	 kl mean: 7.965381622314453 	 loss mean: 92.91435241699219
Approximate NLL:
tensor(120.7947, device='cuda:0')
Approximate KL:
tensor(8.3366, device='cuda:0')
Testing took 0:00:25.413338


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.42it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].42it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].42it/s][A

nll mean: 107.95982360839844 	 kl mean: 8.950788497924805 	 loss mean: 116.91061401367188
nll mean: 108.23336791992188 	 kl mean: 8.950788497924805 	 loss mean: 117.18415832519531
nll mean: 108.43281555175781 	 kl mean: 8.950788497924805 	 loss mean: 117.38360595703125
nll mean: 108.41683959960938 	 kl mean: 8.950788497924805 	 loss mean: 117.36763000488281
nll mean: 108.35636901855469 	 kl mean: 8.950788497924805 	 loss mean: 117.30715942382812



                                              
  0%|          | 0/38 [00:00<?, ?it/s].42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.17it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].17it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].17it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].17it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.00it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.73it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 107.6358642578125 	 kl mean: 8.950788497924805 	 loss mean: 116.58665466308594
nll mean: 107.87326049804688 	 kl mean: 8.950788497924805 	 loss mean: 116.82405090332031
nll mean: 108.89620208740234 	 kl mean: 8.950788497924805 	 loss mean: 117.84698486328125
nll mean: 107.91621398925781 	 kl mean: 8.950788497924805 	 loss mean: 116.86701202392578
nll mean: 108.67123413085938 	 kl mean: 8.950788497924805 	 loss mean: 117.62202453613281



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
 20%|██        | 2/10 [00:00<00:00, 13.96it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A

nll mean: 126.01394653320312 	 kl mean: 8.645843505859375 	 loss mean: 134.6597900390625
nll mean: 126.08123779296875 	 kl mean: 8.645843505859375 	 loss mean: 134.72708129882812
nll mean: 126.35299682617188 	 kl mean: 8.645843505859375 	 loss mean: 134.99884033203125



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.92it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.05it/s][A

nll mean: 125.98056030273438 	 kl mean: 8.645843505859375 	 loss mean: 134.62640380859375
nll mean: 125.65101623535156 	 kl mean: 8.645843505859375 	 loss mean: 134.29685974121094
nll mean: 125.82174682617188 	 kl mean: 8.645843505859375 	 loss mean: 134.46759033203125



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.95it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:15,  2.46it/s][A

nll mean: 126.27391052246094 	 kl mean: 8.645843505859375 	 loss mean: 134.9197540283203
nll mean: 126.28547668457031 	 kl mean: 8.645843505859375 	 loss mean: 134.93133544921875
nll mean: 125.64356231689453 	 kl mean: 8.645843505859375 	 loss mean: 134.28941345214844



                                              
  3%|▎         | 1/38 [00:01<00:15,  2.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.99it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 24.66it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A

nll mean: 126.0736312866211 	 kl mean: 8.645843505859375 	 loss mean: 134.719482421875
nll mean: 98.31996154785156 	 kl mean: 7.9807586669921875 	 loss mean: 106.30072021484375
nll mean: 98.48194885253906 	 kl mean: 7.9807586669921875 	 loss mean: 106.46270751953125
nll mean: 98.52892303466797 	 kl mean: 7.9807586669921875 	 loss mean: 106.50968933105469
nll mean: 98.60762023925781 	 kl mean: 7.9807586669921875 	 loss mean: 106.58837127685547



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.52it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.00it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.34it/s][A

nll mean: 98.79967498779297 	 kl mean: 7.9807586669921875 	 loss mean: 106.78042602539062
nll mean: 98.36680603027344 	 kl mean: 7.9807586669921875 	 loss mean: 106.3475570678711
nll mean: 98.29627990722656 	 kl mean: 7.9807586669921875 	 loss mean: 106.27704620361328
nll mean: 98.35533905029297 	 kl mean: 7.9807586669921875 	 loss mean: 106.33609771728516
nll mean: 98.2121353149414 	 kl mean: 7.9807586669921875 	 loss mean: 106.19288635253906



                                              
100%|██████████| 10/10 [00:00<00:00, 24.33it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A

nll mean: 98.51275634765625 	 kl mean: 7.9807586669921875 	 loss mean: 106.49351501464844
nll mean: 138.67124938964844 	 kl mean: 8.130324363708496 	 loss mean: 146.8015594482422
nll mean: 138.95834350585938 	 kl mean: 8.130324363708496 	 loss mean: 147.0886688232422



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.88it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s][A

nll mean: 138.7108612060547 	 kl mean: 8.130324363708496 	 loss mean: 146.8411865234375
nll mean: 138.83920288085938 	 kl mean: 8.130324363708496 	 loss mean: 146.9695281982422
nll mean: 139.30770874023438 	 kl mean: 8.130324363708496 	 loss mean: 147.43801879882812



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.86it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A

nll mean: 139.13551330566406 	 kl mean: 8.130324363708496 	 loss mean: 147.26583862304688
nll mean: 139.1876678466797 	 kl mean: 8.130324363708496 	 loss mean: 147.3179931640625
nll mean: 138.78622436523438 	 kl mean: 8.130324363708496 	 loss mean: 146.9165496826172



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.78it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]

nll mean: 138.75146484375 	 kl mean: 8.130324363708496 	 loss mean: 146.8817901611328
nll mean: 139.0942840576172 	 kl mean: 8.130324363708496 	 loss mean: 147.22462463378906
nll mean: 124.58516693115234 	 kl mean: 8.098258018493652 	 loss mean: 132.6834259033203



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.45it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.30it/s][A

nll mean: 123.98695373535156 	 kl mean: 8.098258018493652 	 loss mean: 132.085205078125
nll mean: 123.62957763671875 	 kl mean: 8.098258018493652 	 loss mean: 131.7278289794922
nll mean: 124.77371978759766 	 kl mean: 8.098258018493652 	 loss mean: 132.87197875976562



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.24it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A

nll mean: 125.09664154052734 	 kl mean: 8.098258018493652 	 loss mean: 133.1949005126953
nll mean: 124.45890808105469 	 kl mean: 8.098258018493652 	 loss mean: 132.55715942382812
nll mean: 124.51651763916016 	 kl mean: 8.098258018493652 	 loss mean: 132.61477661132812



                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.12it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.11it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.33443450927734 	 kl mean: 8.098258018493652 	 loss mean: 132.4326934814453
nll mean: 124.3797836303711 	 kl mean: 8.098258018493652 	 loss mean: 132.47804260253906
nll mean: 124.55328369140625 	 kl mean: 8.098258018493652 	 loss mean: 132.65155029296875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.71it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 121.97936248779297 	 kl mean: 8.220185279846191 	 loss mean: 130.19955444335938
nll mean: 122.33148956298828 	 kl mean: 8.220185279846191 	 loss mean: 130.5516815185547
nll mean: 122.23731994628906 	 kl mean: 8.220185279846191 	 loss mean: 130.45751953125



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.82it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.72it/s][A

nll mean: 122.24591064453125 	 kl mean: 8.220185279846191 	 loss mean: 130.46609497070312
nll mean: 122.54914855957031 	 kl mean: 8.220185279846191 	 loss mean: 130.7693328857422
nll mean: 122.15116119384766 	 kl mean: 8.220185279846191 	 loss mean: 130.371337890625



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.48it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 122.58442687988281 	 kl mean: 8.220185279846191 	 loss mean: 130.8046112060547
nll mean: 122.59368896484375 	 kl mean: 8.220185279846191 	 loss mean: 130.81387329101562
nll mean: 122.36439514160156 	 kl mean: 8.220185279846191 	 loss mean: 130.58457946777344



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.48it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.47it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A

nll mean: 122.15290832519531 	 kl mean: 8.220185279846191 	 loss mean: 130.37307739257812
nll mean: 132.67971801757812 	 kl mean: 8.236984252929688 	 loss mean: 140.9167022705078
nll mean: 133.06329345703125 	 kl mean: 8.236984252929688 	 loss mean: 141.30027770996094
nll mean: 133.02133178710938 	 kl mean: 8.236984252929688 	 loss mean: 141.25833129882812
nll mean: 133.4307861328125 	 kl mean: 8.236984252929688 	 loss mean: 141.6677703857422



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.17it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.04it/s][A

nll mean: 132.53271484375 	 kl mean: 8.236984252929688 	 loss mean: 140.7696990966797
nll mean: 133.06057739257812 	 kl mean: 8.236984252929688 	 loss mean: 141.29757690429688
nll mean: 132.71482849121094 	 kl mean: 8.236984252929688 	 loss mean: 140.95181274414062
nll mean: 133.19436645507812 	 kl mean: 8.236984252929688 	 loss mean: 141.4313507080078
nll mean: 133.064697265625 	 kl mean: 8.236984252929688 	 loss mean: 141.30169677734375



                                              
100%|██████████| 10/10 [00:00<00:00, 24.81it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.16it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              

nll mean: 133.08140563964844 	 kl mean: 8.236984252929688 	 loss mean: 141.31837463378906
nll mean: 104.87162017822266 	 kl mean: 8.322246551513672 	 loss mean: 113.1938705444336
nll mean: 104.83950805664062 	 kl mean: 8.322246551513672 	 loss mean: 113.16175842285156
nll mean: 104.1678237915039 	 kl mean: 8.322246551513672 	 loss mean: 112.49008178710938
nll mean: 104.57283020019531 	 kl mean: 8.322246551513672 	 loss mean: 112.89508056640625


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.12it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.04it/s][A
                                              

nll mean: 104.16386413574219 	 kl mean: 8.322246551513672 	 loss mean: 112.4861068725586
nll mean: 104.37284851074219 	 kl mean: 8.322246551513672 	 loss mean: 112.69509887695312
nll mean: 104.7025146484375 	 kl mean: 8.322246551513672 	 loss mean: 113.02476501464844
nll mean: 104.93720245361328 	 kl mean: 8.322246551513672 	 loss mean: 113.25944519042969
nll mean: 104.54417419433594 	 kl mean: 8.322246551513672 	 loss mean: 112.86642456054688


                                              
100%|██████████| 10/10 [00:00<00:00, 24.95it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 15.23it/s][A

nll mean: 104.57975769042969 	 kl mean: 8.322246551513672 	 loss mean: 112.90200805664062
nll mean: 131.60401916503906 	 kl mean: 8.592019081115723 	 loss mean: 140.196044921875
nll mean: 132.39981079101562 	 kl mean: 8.592019081115723 	 loss mean: 140.99183654785156


                                              
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.90it/s]
 20%|██        | 2/10 [00:00<00:00, 15.23it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 40%|████      | 4/10 [00:00<00:00, 15.23it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.14it/s][A

nll mean: 131.97329711914062 	 kl mean: 8.592019081115723 	 loss mean: 140.5653076171875
nll mean: 131.98974609375 	 kl mean: 8.592019081115723 	 loss mean: 140.58175659179688
nll mean: 131.5061798095703 	 kl mean: 8.592019081115723 	 loss mean: 140.09820556640625
nll mean: 132.4008026123047 	 kl mean: 8.592019081115723 	 loss mean: 140.99282836914062


                                              
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.14it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.90it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.11it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.32003784179688 	 kl mean: 8.592019081115723 	 loss mean: 140.91204833984375
nll mean: 131.79556274414062 	 kl mean: 8.592019081115723 	 loss mean: 140.3875732421875
nll mean: 131.7397918701172 	 kl mean: 8.592019081115723 	 loss mean: 140.33181762695312
nll mean: 131.59527587890625 	 kl mean: 8.592019081115723 	 loss mean: 140.18731689453125



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
 30%|███       | 3/10 [00:00<00:00, 21.55it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A

nll mean: 131.80209350585938 	 kl mean: 8.340071678161621 	 loss mean: 140.14215087890625
nll mean: 131.39732360839844 	 kl mean: 8.340071678161621 	 loss mean: 139.73739624023438
nll mean: 131.68673706054688 	 kl mean: 8.340071678161621 	 loss mean: 140.0268096923828
nll mean: 132.08596801757812 	 kl mean: 8.340071678161621 	 loss mean: 140.42605590820312
nll mean: 132.07391357421875 	 kl mean: 8.340071678161621 	 loss mean: 140.41397094726562



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.51it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.47it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.41it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.86it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.42721557617188 	 kl mean: 8.340071678161621 	 loss mean: 140.7672882080078
nll mean: 131.74476623535156 	 kl mean: 8.340071678161621 	 loss mean: 140.0848388671875
nll mean: 131.93502807617188 	 kl mean: 8.340071678161621 	 loss mean: 140.27508544921875
nll mean: 131.69219970703125 	 kl mean: 8.340071678161621 	 loss mean: 140.0322723388672
nll mean: 131.33834838867188 	 kl mean: 8.340071678161621 	 loss mean: 139.67840576171875



                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.86it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.86it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.86it/s]
 30%|███       | 3/10 [00:00<00:00, 24.88it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.86it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.86it/s][A

nll mean: 119.88218688964844 	 kl mean: 8.361089706420898 	 loss mean: 128.2432861328125
nll mean: 120.0724868774414 	 kl mean: 8.361089706420898 	 loss mean: 128.43357849121094
nll mean: 120.12301635742188 	 kl mean: 8.361089706420898 	 loss mean: 128.48410034179688
nll mean: 120.49987030029297 	 kl mean: 8.361089706420898 	 loss mean: 128.8609619140625
nll mean: 120.07904052734375 	 kl mean: 8.361089706420898 	 loss mean: 128.44012451171875



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.86it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.73it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.86it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.86it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.86it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.68it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.61it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.98555755615234 	 kl mean: 8.361089706420898 	 loss mean: 128.34664916992188
nll mean: 119.81086730957031 	 kl mean: 8.361089706420898 	 loss mean: 128.17196655273438
nll mean: 120.48805236816406 	 kl mean: 8.361089706420898 	 loss mean: 128.84915161132812
nll mean: 119.88423156738281 	 kl mean: 8.361089706420898 	 loss mean: 128.24533081054688
nll mean: 119.9720458984375 	 kl mean: 8.361089706420898 	 loss mean: 128.3331298828125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 22.06it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A

nll mean: 140.28076171875 	 kl mean: 8.36264419555664 	 loss mean: 148.64340209960938
nll mean: 139.70281982421875 	 kl mean: 8.36264419555664 	 loss mean: 148.0654754638672
nll mean: 140.38870239257812 	 kl mean: 8.36264419555664 	 loss mean: 148.75135803222656
nll mean: 140.02188110351562 	 kl mean: 8.36264419555664 	 loss mean: 148.384521484375
nll mean: 139.79969787597656 	 kl mean: 8.36264419555664 	 loss mean: 148.162353515625



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.82it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.61it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.41it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 140.22421264648438 	 kl mean: 8.36264419555664 	 loss mean: 148.58685302734375
nll mean: 139.88461303710938 	 kl mean: 8.36264419555664 	 loss mean: 148.24725341796875
nll mean: 139.59555053710938 	 kl mean: 8.36264419555664 	 loss mean: 147.95819091796875
nll mean: 139.82199096679688 	 kl mean: 8.36264419555664 	 loss mean: 148.18466186523438
nll mean: 139.67510986328125 	 kl mean: 8.36264419555664 	 loss mean: 148.03775024414062



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s]
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.04it/s][A

nll mean: 119.47440338134766 	 kl mean: 8.299661636352539 	 loss mean: 127.7740478515625
nll mean: 119.11944580078125 	 kl mean: 8.299661636352539 	 loss mean: 127.41911315917969
nll mean: 119.3096923828125 	 kl mean: 8.299661636352539 	 loss mean: 127.6093521118164



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.58it/s][A

nll mean: 118.81251525878906 	 kl mean: 8.299661636352539 	 loss mean: 127.11216735839844
nll mean: 119.15042114257812 	 kl mean: 8.299661636352539 	 loss mean: 127.45008850097656
nll mean: 118.52499389648438 	 kl mean: 8.299661636352539 	 loss mean: 126.82466125488281



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.62it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A

nll mean: 119.15977478027344 	 kl mean: 8.299661636352539 	 loss mean: 127.45943450927734
nll mean: 119.24076843261719 	 kl mean: 8.299661636352539 	 loss mean: 127.5404281616211
nll mean: 118.3464584350586 	 kl mean: 8.299661636352539 	 loss mean: 126.6461181640625



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.04it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.56it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s]
 20%|██        | 2/10 [00:00<00:00, 10.30it/s][A

nll mean: 118.55928039550781 	 kl mean: 8.299661636352539 	 loss mean: 126.85894775390625
nll mean: 160.96463012695312 	 kl mean: 8.84289264678955 	 loss mean: 169.80752563476562
nll mean: 160.77146911621094 	 kl mean: 8.84289264678955 	 loss mean: 169.6143798828125



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.23it/s][A
                                               

nll mean: 161.05819702148438 	 kl mean: 8.84289264678955 	 loss mean: 169.90109252929688
nll mean: 160.7045440673828 	 kl mean: 8.84289264678955 	 loss mean: 169.54745483398438



 34%|███▍      | 13/38 [00:07<00:14,  1.72it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.10it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A

nll mean: 160.45431518554688 	 kl mean: 8.84289264678955 	 loss mean: 169.29721069335938
nll mean: 160.3060302734375 	 kl mean: 8.84289264678955 	 loss mean: 169.14891052246094
nll mean: 160.74093627929688 	 kl mean: 8.84289264678955 	 loss mean: 169.58383178710938



 70%|███████   | 7/10 [00:00<00:00, 10.09it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.06it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.72it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.98it/s][A
                                              

nll mean: 160.14450073242188 	 kl mean: 8.84289264678955 	 loss mean: 168.9873809814453
nll mean: 161.05661010742188 	 kl mean: 8.84289264678955 	 loss mean: 169.8994903564453


                                               
100%|██████████| 10/10 [00:00<00:00, 10.05it/s][A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.33it/s][A

nll mean: 160.97576904296875 	 kl mean: 8.84289264678955 	 loss mean: 169.81866455078125
nll mean: 135.3972930908203 	 kl mean: 7.922886371612549 	 loss mean: 143.3201904296875
nll mean: 135.396484375 	 kl mean: 7.922886371612549 	 loss mean: 143.31936645507812
nll mean: 135.3428955078125 	 kl mean: 7.922886371612549 	 loss mean: 143.26577758789062


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 20%|██        | 2/10 [00:00<00:00, 18.33it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 40%|████      | 4/10 [00:00<00:00, 18.07it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.99it/s][A

nll mean: 134.6597900390625 	 kl mean: 7.922886371612549 	 loss mean: 142.58267211914062
nll mean: 135.37164306640625 	 kl mean: 7.922886371612549 	 loss mean: 143.29452514648438
nll mean: 135.86924743652344 	 kl mean: 7.922886371612549 	 loss mean: 143.79214477539062
nll mean: 135.50967407226562 	 kl mean: 7.922886371612549 	 loss mean: 143.4325714111328


                                               
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.99it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:16,  1.41it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:16,  1.41it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.83it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 135.5830841064453 	 kl mean: 7.922886371612549 	 loss mean: 143.5059814453125
nll mean: 135.00750732421875 	 kl mean: 7.922886371612549 	 loss mean: 142.930419921875
nll mean: 135.12451171875 	 kl mean: 7.922886371612549 	 loss mean: 143.0474090576172



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A

nll mean: 142.04217529296875 	 kl mean: 8.431138038635254 	 loss mean: 150.4733123779297
nll mean: 142.04168701171875 	 kl mean: 8.431138038635254 	 loss mean: 150.47280883789062
nll mean: 141.98675537109375 	 kl mean: 8.431138038635254 	 loss mean: 150.4178924560547



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.78it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.79it/s][A

nll mean: 142.2677764892578 	 kl mean: 8.431138038635254 	 loss mean: 150.69891357421875
nll mean: 141.84747314453125 	 kl mean: 8.431138038635254 	 loss mean: 150.27859497070312
nll mean: 142.07968139648438 	 kl mean: 8.431138038635254 	 loss mean: 150.51080322265625



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A

nll mean: 141.47613525390625 	 kl mean: 8.431138038635254 	 loss mean: 149.9072723388672
nll mean: 141.58041381835938 	 kl mean: 8.431138038635254 	 loss mean: 150.0115509033203
nll mean: 142.05752563476562 	 kl mean: 8.431138038635254 	 loss mean: 150.48866271972656



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.75it/s][A
 42%|████▏     | 16/38 [00:09<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.58it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A

nll mean: 141.65875244140625 	 kl mean: 8.431138038635254 	 loss mean: 150.08990478515625
nll mean: 143.577880859375 	 kl mean: 7.986148357391357 	 loss mean: 151.5640411376953
nll mean: 143.22793579101562 	 kl mean: 7.986148357391357 	 loss mean: 151.21409606933594
nll mean: 144.03594970703125 	 kl mean: 7.986148357391357 	 loss mean: 152.0220947265625
nll mean: 143.63023376464844 	 kl mean: 7.986148357391357 	 loss mean: 151.61639404296875



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.42it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.50it/s][A

nll mean: 143.3687744140625 	 kl mean: 7.986148357391357 	 loss mean: 151.35491943359375
nll mean: 143.90936279296875 	 kl mean: 7.986148357391357 	 loss mean: 151.8955078125
nll mean: 143.89413452148438 	 kl mean: 7.986148357391357 	 loss mean: 151.88027954101562
nll mean: 143.62515258789062 	 kl mean: 7.986148357391357 	 loss mean: 151.6112823486328
nll mean: 143.5713653564453 	 kl mean: 7.986148357391357 	 loss mean: 151.55752563476562



                                               
100%|██████████| 10/10 [00:00<00:00, 24.42it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.15it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A


nll mean: 144.0406494140625 	 kl mean: 7.986148357391357 	 loss mean: 152.02679443359375
nll mean: 133.23495483398438 	 kl mean: 8.316202163696289 	 loss mean: 141.5511474609375
nll mean: 133.15328979492188 	 kl mean: 8.316202163696289 	 loss mean: 141.469482421875
nll mean: 133.4019012451172 	 kl mean: 8.316202163696289 	 loss mean: 141.71810913085938
nll mean: 133.66915893554688 	 kl mean: 8.316202163696289 	 loss mean: 141.98538208007812


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.09it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.08it/s][A
                                               

nll mean: 133.49197387695312 	 kl mean: 8.316202163696289 	 loss mean: 141.80816650390625
nll mean: 133.0907745361328 	 kl mean: 8.316202163696289 	 loss mean: 141.406982421875
nll mean: 133.06494140625 	 kl mean: 8.316202163696289 	 loss mean: 141.38113403320312
nll mean: 133.327392578125 	 kl mean: 8.316202163696289 	 loss mean: 141.6436004638672
nll mean: 133.16348266601562 	 kl mean: 8.316202163696289 	 loss mean: 141.47967529296875



100%|██████████| 10/10 [00:00<00:00, 24.99it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.22it/s][A

nll mean: 133.1826934814453 	 kl mean: 8.316202163696289 	 loss mean: 141.4989013671875
nll mean: 129.16256713867188 	 kl mean: 8.707242965698242 	 loss mean: 137.86981201171875
nll mean: 129.5389404296875 	 kl mean: 8.707242965698242 	 loss mean: 138.24618530273438
nll mean: 129.36898803710938 	 kl mean: 8.707242965698242 	 loss mean: 138.07623291015625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 20%|██        | 2/10 [00:00<00:00, 12.22it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 40%|████      | 4/10 [00:00<00:00, 12.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.38it/s][A

nll mean: 128.99974060058594 	 kl mean: 8.707242965698242 	 loss mean: 137.70700073242188
nll mean: 129.771484375 	 kl mean: 8.707242965698242 	 loss mean: 138.47872924804688
nll mean: 129.79144287109375 	 kl mean: 8.707242965698242 	 loss mean: 138.49868774414062


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.38it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.37it/s][A

nll mean: 129.09100341796875 	 kl mean: 8.707242965698242 	 loss mean: 137.79824829101562
nll mean: 129.75942993164062 	 kl mean: 8.707242965698242 	 loss mean: 138.46665954589844
nll mean: 129.49090576171875 	 kl mean: 8.707242965698242 	 loss mean: 138.19815063476562


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.75it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A

nll mean: 130.2279052734375 	 kl mean: 8.707242965698242 	 loss mean: 138.93515014648438
nll mean: 148.26873779296875 	 kl mean: 8.587648391723633 	 loss mean: 156.85638427734375
nll mean: 148.37486267089844 	 kl mean: 8.587648391723633 	 loss mean: 156.96249389648438


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 12.42it/s][A

nll mean: 147.83470153808594 	 kl mean: 8.587648391723633 	 loss mean: 156.42234802246094
nll mean: 147.4911346435547 	 kl mean: 8.587648391723633 	 loss mean: 156.07879638671875
nll mean: 148.32704162597656 	 kl mean: 8.587648391723633 	 loss mean: 156.91468811035156


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 12.42it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.42it/s][A

nll mean: 149.0826416015625 	 kl mean: 8.587648391723633 	 loss mean: 157.67030334472656
nll mean: 148.8013916015625 	 kl mean: 8.587648391723633 	 loss mean: 157.3890380859375
nll mean: 148.2371368408203 	 kl mean: 8.587648391723633 	 loss mean: 156.82476806640625


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.42it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.40it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]

nll mean: 148.6068115234375 	 kl mean: 8.587648391723633 	 loss mean: 157.1944580078125
nll mean: 147.80401611328125 	 kl mean: 8.587648391723633 	 loss mean: 156.39166259765625
nll mean: 156.90525817871094 	 kl mean: 8.24184799194336 	 loss mean: 165.1470947265625



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.62it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.54it/s][A

nll mean: 156.54022216796875 	 kl mean: 8.24184799194336 	 loss mean: 164.78207397460938
nll mean: 156.75140380859375 	 kl mean: 8.24184799194336 	 loss mean: 164.99327087402344
nll mean: 156.4301300048828 	 kl mean: 8.24184799194336 	 loss mean: 164.67196655273438



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A

nll mean: 155.84219360351562 	 kl mean: 8.24184799194336 	 loss mean: 164.08401489257812
nll mean: 156.29122924804688 	 kl mean: 8.24184799194336 	 loss mean: 164.53309631347656
nll mean: 156.64859008789062 	 kl mean: 8.24184799194336 	 loss mean: 164.89044189453125



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.69it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 156.54144287109375 	 kl mean: 8.24184799194336 	 loss mean: 164.78329467773438
nll mean: 156.0252685546875 	 kl mean: 8.24184799194336 	 loss mean: 164.26712036132812
nll mean: 156.58056640625 	 kl mean: 8.24184799194336 	 loss mean: 164.82241821289062



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.34it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A

nll mean: 117.98973846435547 	 kl mean: 8.219862937927246 	 loss mean: 126.2095947265625
nll mean: 117.1663818359375 	 kl mean: 8.219862937927246 	 loss mean: 125.38623809814453
nll mean: 117.40422058105469 	 kl mean: 8.219862937927246 	 loss mean: 125.62408447265625



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.21it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.23it/s][A

nll mean: 117.46452331542969 	 kl mean: 8.219862937927246 	 loss mean: 125.68438720703125
nll mean: 117.86663055419922 	 kl mean: 8.219862937927246 	 loss mean: 126.08648681640625
nll mean: 117.7110595703125 	 kl mean: 8.219862937927246 	 loss mean: 125.9309310913086



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.24it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A

nll mean: 117.64423370361328 	 kl mean: 8.219862937927246 	 loss mean: 125.86408996582031
nll mean: 117.94193267822266 	 kl mean: 8.219862937927246 	 loss mean: 126.16178894042969
nll mean: 116.99513244628906 	 kl mean: 8.219862937927246 	 loss mean: 125.21499633789062



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.21it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.08it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A

nll mean: 117.26253509521484 	 kl mean: 8.219862937927246 	 loss mean: 125.48239135742188
nll mean: 106.74710083007812 	 kl mean: 7.422049522399902 	 loss mean: 114.16914367675781
nll mean: 107.02523803710938 	 kl mean: 7.422049522399902 	 loss mean: 114.44729614257812
nll mean: 106.92013549804688 	 kl mean: 7.422049522399902 	 loss mean: 114.34217834472656
nll mean: 107.65255737304688 	 kl mean: 7.422049522399902 	 loss mean: 115.0746078491211
nll mean: 106.97647857666016 	 kl mean: 7.422049522399902 	 loss mean: 114.39852905273438
nll mean: 107.13619232177734 	 kl mean: 7.422049522399902 	 loss mean: 114.55824279785156



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
 80%|████████  | 8/10 [00:00<00:00, 32.95it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.53it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]

nll mean: 107.20298767089844 	 kl mean: 7.422049522399902 	 loss mean: 114.62503051757812
nll mean: 106.86000061035156 	 kl mean: 7.422049522399902 	 loss mean: 114.28205871582031
nll mean: 107.48920440673828 	 kl mean: 7.422049522399902 	 loss mean: 114.9112548828125
nll mean: 106.55889892578125 	 kl mean: 7.422049522399902 	 loss mean: 113.98094940185547
nll mean: 156.44032287597656 	 kl mean: 8.546330451965332 	 loss mean: 164.98666381835938



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.49it/s][A

nll mean: 156.4226837158203 	 kl mean: 8.546330451965332 	 loss mean: 164.96900939941406
nll mean: 156.2510986328125 	 kl mean: 8.546330451965332 	 loss mean: 164.79742431640625
nll mean: 156.77105712890625 	 kl mean: 8.546330451965332 	 loss mean: 165.31739807128906



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.56it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A

nll mean: 156.64544677734375 	 kl mean: 8.546330451965332 	 loss mean: 165.1917724609375
nll mean: 156.65386962890625 	 kl mean: 8.546330451965332 	 loss mean: 165.2001953125
nll mean: 156.4469757080078 	 kl mean: 8.546330451965332 	 loss mean: 164.99330139160156



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.57it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.58it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]

nll mean: 156.51397705078125 	 kl mean: 8.546330451965332 	 loss mean: 165.060302734375
nll mean: 156.5089874267578 	 kl mean: 8.546330451965332 	 loss mean: 165.05532836914062
nll mean: 156.2986297607422 	 kl mean: 8.546330451965332 	 loss mean: 164.844970703125
nll mean: 121.0617446899414 	 kl mean: 9.259626388549805 	 loss mean: 130.32138061523438



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.82it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.59it/s][A

nll mean: 121.04813385009766 	 kl mean: 9.259626388549805 	 loss mean: 130.30776977539062
nll mean: 120.93557739257812 	 kl mean: 9.259626388549805 	 loss mean: 130.1951904296875
nll mean: 120.57861328125 	 kl mean: 9.259626388549805 	 loss mean: 129.83824157714844
nll mean: 121.32386779785156 	 kl mean: 9.259626388549805 	 loss mean: 130.58349609375
nll mean: 121.22645568847656 	 kl mean: 9.259626388549805 	 loss mean: 130.486083984375



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.42it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.29it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.42207336425781 	 kl mean: 9.259626388549805 	 loss mean: 129.68170166015625
nll mean: 121.29509735107422 	 kl mean: 9.259626388549805 	 loss mean: 130.55471801757812
nll mean: 120.4432144165039 	 kl mean: 9.259626388549805 	 loss mean: 129.70285034179688
nll mean: 120.69941711425781 	 kl mean: 9.259626388549805 	 loss mean: 129.95904541015625



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.72it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A

nll mean: 114.3721923828125 	 kl mean: 7.914880275726318 	 loss mean: 122.28707122802734
nll mean: 114.11717224121094 	 kl mean: 7.914880275726318 	 loss mean: 122.03205871582031
nll mean: 113.743896484375 	 kl mean: 7.914880275726318 	 loss mean: 121.65878295898438



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.73it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.66it/s][A

nll mean: 114.11009216308594 	 kl mean: 7.914880275726318 	 loss mean: 122.02497863769531
nll mean: 113.4273681640625 	 kl mean: 7.914880275726318 	 loss mean: 121.34225463867188
nll mean: 113.7457504272461 	 kl mean: 7.914880275726318 	 loss mean: 121.66063690185547



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.68it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A

nll mean: 114.48482513427734 	 kl mean: 7.914880275726318 	 loss mean: 122.39970397949219
nll mean: 113.99508666992188 	 kl mean: 7.914880275726318 	 loss mean: 121.90998077392578
nll mean: 113.98880004882812 	 kl mean: 7.914880275726318 	 loss mean: 121.90367889404297



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.69it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 22.95it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 113.83505249023438 	 kl mean: 7.914880275726318 	 loss mean: 121.74993133544922
nll mean: 82.99095153808594 	 kl mean: 7.2001752853393555 	 loss mean: 90.19113159179688
nll mean: 82.93168640136719 	 kl mean: 7.2001752853393555 	 loss mean: 90.1318588256836
nll mean: 82.83567810058594 	 kl mean: 7.2001752853393555 	 loss mean: 90.03585815429688
nll mean: 82.16038513183594 	 kl mean: 7.2001752853393555 	 loss mean: 89.36056518554688



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.40it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.27it/s][A

nll mean: 82.21359252929688 	 kl mean: 7.2001752853393555 	 loss mean: 89.41377258300781
nll mean: 83.43508911132812 	 kl mean: 7.2001752853393555 	 loss mean: 90.63526916503906
nll mean: 82.6845703125 	 kl mean: 7.2001752853393555 	 loss mean: 89.8847427368164
nll mean: 83.01887512207031 	 kl mean: 7.2001752853393555 	 loss mean: 90.21905517578125
nll mean: 82.9375 	 kl mean: 7.2001752853393555 	 loss mean: 90.1376724243164



                                               
100%|██████████| 10/10 [00:00<00:00, 22.11it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.42it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s][A

nll mean: 83.56328582763672 	 kl mean: 7.2001752853393555 	 loss mean: 90.76346588134766
nll mean: 108.36572265625 	 kl mean: 7.707820415496826 	 loss mean: 116.07354736328125
nll mean: 108.64673614501953 	 kl mean: 7.707820415496826 	 loss mean: 116.35455322265625
nll mean: 108.86183166503906 	 kl mean: 7.707820415496826 	 loss mean: 116.56965637207031
nll mean: 108.70252990722656 	 kl mean: 7.707820415496826 	 loss mean: 116.41035461425781



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.49it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.41it/s][A

nll mean: 109.34632873535156 	 kl mean: 7.707820415496826 	 loss mean: 117.05415344238281
nll mean: 108.14276123046875 	 kl mean: 7.707820415496826 	 loss mean: 115.8505859375
nll mean: 108.40680694580078 	 kl mean: 7.707820415496826 	 loss mean: 116.1146240234375
nll mean: 108.61834716796875 	 kl mean: 7.707820415496826 	 loss mean: 116.326171875
nll mean: 109.00885009765625 	 kl mean: 7.707820415496826 	 loss mean: 116.7166748046875



                                               
100%|██████████| 10/10 [00:00<00:00, 21.56it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A

nll mean: 108.6476058959961 	 kl mean: 7.707820415496826 	 loss mean: 116.35542297363281
nll mean: 120.2088394165039 	 kl mean: 8.438324928283691 	 loss mean: 128.6471710205078
nll mean: 119.91517639160156 	 kl mean: 8.438324928283691 	 loss mean: 128.35350036621094



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.64it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 120.56614685058594 	 kl mean: 8.438324928283691 	 loss mean: 129.00448608398438
nll mean: 120.0845947265625 	 kl mean: 8.438324928283691 	 loss mean: 128.52293395996094
nll mean: 120.16423034667969 	 kl mean: 8.438324928283691 	 loss mean: 128.60255432128906



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.63it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.71it/s][A

nll mean: 120.12222290039062 	 kl mean: 8.438324928283691 	 loss mean: 128.560546875
nll mean: 120.5204086303711 	 kl mean: 8.438324928283691 	 loss mean: 128.958740234375
nll mean: 120.57896423339844 	 kl mean: 8.438324928283691 	 loss mean: 129.0172882080078



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.64it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]

nll mean: 120.06092834472656 	 kl mean: 8.438324928283691 	 loss mean: 128.49925231933594
nll mean: 120.50445556640625 	 kl mean: 8.438324928283691 	 loss mean: 128.94277954101562
nll mean: 61.23801040649414 	 kl mean: 8.678435325622559 	 loss mean: 69.91644287109375



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
 20%|██        | 2/10 [00:00<00:00, 10.43it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.29it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 10.29it/s][A

nll mean: 61.86761474609375 	 kl mean: 8.678435325622559 	 loss mean: 70.54605102539062
nll mean: 61.63972473144531 	 kl mean: 8.678435325622559 	 loss mean: 70.31816101074219
nll mean: 61.74158477783203 	 kl mean: 8.678435325622559 	 loss mean: 70.4200210571289


 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.26it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.26it/s][A

nll mean: 61.32719802856445 	 kl mean: 8.678435325622559 	 loss mean: 70.00563049316406
nll mean: 61.431663513183594 	 kl mean: 8.678435325622559 	 loss mean: 70.110107421875
nll mean: 61.968101501464844 	 kl mean: 8.678435325622559 	 loss mean: 70.64653778076172



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.62it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.26it/s][A
                                              

nll mean: 61.95772171020508 	 kl mean: 8.678435325622559 	 loss mean: 70.63616180419922
nll mean: 61.46820068359375 	 kl mean: 8.678435325622559 	 loss mean: 70.14663696289062


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.62it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.18it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.33it/s][A

nll mean: 61.14584732055664 	 kl mean: 8.678435325622559 	 loss mean: 69.82427978515625
nll mean: 104.2925033569336 	 kl mean: 7.9986419677734375 	 loss mean: 112.29114532470703
nll mean: 103.752197265625 	 kl mean: 7.9986419677734375 	 loss mean: 111.75084686279297



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.01it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A

nll mean: 103.955078125 	 kl mean: 7.9986419677734375 	 loss mean: 111.95372009277344
nll mean: 104.51505279541016 	 kl mean: 7.9986419677734375 	 loss mean: 112.51368713378906
nll mean: 103.96888732910156 	 kl mean: 7.9986419677734375 	 loss mean: 111.967529296875



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.80it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A

nll mean: 104.5123291015625 	 kl mean: 7.9986419677734375 	 loss mean: 112.5109634399414
nll mean: 104.20525360107422 	 kl mean: 7.9986419677734375 	 loss mean: 112.20389556884766
nll mean: 104.37739562988281 	 kl mean: 7.9986419677734375 	 loss mean: 112.37604522705078



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.55it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
 10%|█         | 1/10 [00:00<00:00,  9.99it/s][A

nll mean: 104.56352996826172 	 kl mean: 7.9986419677734375 	 loss mean: 112.56216430664062
nll mean: 103.84591674804688 	 kl mean: 7.9986419677734375 	 loss mean: 111.84455871582031
nll mean: 137.17098999023438 	 kl mean: 8.973138809204102 	 loss mean: 146.14413452148438



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.93it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A


nll mean: 137.13845825195312 	 kl mean: 8.973138809204102 	 loss mean: 146.11160278320312
nll mean: 137.3981170654297 	 kl mean: 8.973138809204102 	 loss mean: 146.37124633789062
nll mean: 136.12625122070312 	 kl mean: 8.973138809204102 	 loss mean: 145.09938049316406


 40%|████      | 4/10 [00:00<00:00,  9.98it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.95it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.91it/s][A

nll mean: 137.0968475341797 	 kl mean: 8.973138809204102 	 loss mean: 146.06997680664062
nll mean: 137.38644409179688 	 kl mean: 8.973138809204102 	 loss mean: 146.35958862304688



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.91it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.89it/s][A

nll mean: 136.96633911132812 	 kl mean: 8.973138809204102 	 loss mean: 145.93948364257812
nll mean: 138.0565185546875 	 kl mean: 8.973138809204102 	 loss mean: 147.0296630859375



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.87it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]

nll mean: 137.31747436523438 	 kl mean: 8.973138809204102 	 loss mean: 146.2906036376953
nll mean: 137.19483947753906 	 kl mean: 8.973138809204102 	 loss mean: 146.16796875
nll mean: 63.453086853027344 	 kl mean: 7.592257022857666 	 loss mean: 71.04534912109375
nll mean: 63.150672912597656 	 kl mean: 7.592257022857666 	 loss mean: 70.74293518066406



                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 25.91it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A

nll mean: 62.876155853271484 	 kl mean: 7.592257022857666 	 loss mean: 70.46841430664062
nll mean: 63.551815032958984 	 kl mean: 7.592257022857666 	 loss mean: 71.14407348632812
nll mean: 63.327003479003906 	 kl mean: 7.592257022857666 	 loss mean: 70.91926574707031
nll mean: 62.75181579589844 	 kl mean: 7.592257022857666 	 loss mean: 70.34407043457031
nll mean: 63.17655944824219 	 kl mean: 7.592257022857666 	 loss mean: 70.76881408691406
nll mean: 62.925994873046875 	 kl mean: 7.592257022857666 	 loss mean: 70.51825714111328



                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.53it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.38it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A

nll mean: 62.93942642211914 	 kl mean: 7.592257022857666 	 loss mean: 70.53168487548828
nll mean: 62.729949951171875 	 kl mean: 7.592257022857666 	 loss mean: 70.32220458984375
nll mean: 117.90908813476562 	 kl mean: 7.806397438049316 	 loss mean: 125.71548461914062
nll mean: 118.49057006835938 	 kl mean: 7.806397438049316 	 loss mean: 126.29696655273438
nll mean: 118.00991821289062 	 kl mean: 7.806397438049316 	 loss mean: 125.81631469726562



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.61it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A

nll mean: 117.94932556152344 	 kl mean: 7.806397438049316 	 loss mean: 125.75572204589844
nll mean: 117.74433898925781 	 kl mean: 7.806397438049316 	 loss mean: 125.55073547363281
nll mean: 117.86787414550781 	 kl mean: 7.806397438049316 	 loss mean: 125.67427062988281
nll mean: 118.23394775390625 	 kl mean: 7.806397438049316 	 loss mean: 126.04033660888672
nll mean: 118.18937683105469 	 kl mean: 7.806397438049316 	 loss mean: 125.99578094482422



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.66it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.63it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]

nll mean: 118.21356201171875 	 kl mean: 7.806397438049316 	 loss mean: 126.01997375488281
nll mean: 117.62242889404297 	 kl mean: 7.806397438049316 	 loss mean: 125.42882537841797
nll mean: 119.41934204101562 	 kl mean: 8.167562484741211 	 loss mean: 127.5869140625



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.86it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.87it/s][A

nll mean: 120.3305892944336 	 kl mean: 8.167562484741211 	 loss mean: 128.49813842773438
nll mean: 119.81978607177734 	 kl mean: 8.167562484741211 	 loss mean: 127.98735046386719
nll mean: 120.0172119140625 	 kl mean: 8.167562484741211 	 loss mean: 128.1847686767578



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.70it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A

nll mean: 119.88740539550781 	 kl mean: 8.167562484741211 	 loss mean: 128.05496215820312
nll mean: 120.28083801269531 	 kl mean: 8.167562484741211 	 loss mean: 128.44839477539062
nll mean: 120.19841766357422 	 kl mean: 8.167562484741211 	 loss mean: 128.36598205566406



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.55it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.99285888671875 	 kl mean: 8.167562484741211 	 loss mean: 128.16041564941406
nll mean: 119.65178680419922 	 kl mean: 8.167562484741211 	 loss mean: 127.81934356689453
nll mean: 120.05235290527344 	 kl mean: 8.167562484741211 	 loss mean: 128.21990966796875



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 10.70it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s][A

nll mean: 113.4328842163086 	 kl mean: 7.977282524108887 	 loss mean: 121.41017150878906
nll mean: 112.8851318359375 	 kl mean: 7.977282524108887 	 loss mean: 120.86241912841797
nll mean: 112.91590881347656 	 kl mean: 7.977282524108887 	 loss mean: 120.8931884765625



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.63it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.65it/s][A

nll mean: 113.42514038085938 	 kl mean: 7.977282524108887 	 loss mean: 121.40242767333984
nll mean: 113.01034545898438 	 kl mean: 7.977282524108887 	 loss mean: 120.98762512207031
nll mean: 113.37130737304688 	 kl mean: 7.977282524108887 	 loss mean: 121.34859466552734



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.65it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A

nll mean: 112.54095458984375 	 kl mean: 7.977282524108887 	 loss mean: 120.51823425292969
nll mean: 113.11634826660156 	 kl mean: 7.977282524108887 	 loss mean: 121.0936279296875
nll mean: 113.00035095214844 	 kl mean: 7.977282524108887 	 loss mean: 120.97764587402344



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.63it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 21.94it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A

nll mean: 113.15275573730469 	 kl mean: 7.977282524108887 	 loss mean: 121.13003540039062
nll mean: 110.9912338256836 	 kl mean: 8.229238510131836 	 loss mean: 119.22047424316406
nll mean: 110.58313751220703 	 kl mean: 8.229238510131836 	 loss mean: 118.8123779296875
nll mean: 110.63568115234375 	 kl mean: 8.229238510131836 	 loss mean: 118.86492919921875
nll mean: 111.25884246826172 	 kl mean: 8.229238510131836 	 loss mean: 119.48808288574219



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.66it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.52it/s][A

nll mean: 110.60733032226562 	 kl mean: 8.229238510131836 	 loss mean: 118.83657836914062
nll mean: 110.49447631835938 	 kl mean: 8.229238510131836 	 loss mean: 118.72370910644531
nll mean: 110.5135498046875 	 kl mean: 8.229238510131836 	 loss mean: 118.74279022216797
nll mean: 111.13076782226562 	 kl mean: 8.229238510131836 	 loss mean: 119.36001586914062
nll mean: 111.1756591796875 	 kl mean: 8.229238510131836 	 loss mean: 119.40489959716797



                                               
100%|██████████| 10/10 [00:00<00:00, 21.44it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.91it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A

nll mean: 110.90565490722656 	 kl mean: 8.229238510131836 	 loss mean: 119.13490295410156
nll mean: 84.17762756347656 	 kl mean: 8.726934432983398 	 loss mean: 92.9045639038086
nll mean: 84.50514221191406 	 kl mean: 8.726934432983398 	 loss mean: 93.2320785522461
nll mean: 84.10531616210938 	 kl mean: 8.726934432983398 	 loss mean: 92.83226013183594
nll mean: 84.57762908935547 	 kl mean: 8.726934432983398 	 loss mean: 93.3045654296875
nll mean: 84.48407745361328 	 kl mean: 8.726934432983398 	 loss mean: 93.21101379394531
nll mean: 84.21156311035156 	 kl mean: 8.726934432983398 	 loss mean: 92.9384994506836



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.71it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.53it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 83.90499877929688 	 kl mean: 8.726934432983398 	 loss mean: 92.63191986083984
nll mean: 84.53094482421875 	 kl mean: 8.726934432983398 	 loss mean: 93.25787353515625
nll mean: 85.29853820800781 	 kl mean: 8.726934432983398 	 loss mean: 94.02547454833984
nll mean: 84.55955505371094 	 kl mean: 8.726934432983398 	 loss mean: 93.28649139404297
Approximate NLL:
tensor(120.9791, device='cuda:0')
Approximate KL:
tensor(8.2716, device='cuda:0')
Testing took 0:00:25.249432


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.78it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].78it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].78it/s][A

nll mean: 110.21690368652344 	 kl mean: 8.723892211914062 	 loss mean: 118.9407958984375
nll mean: 109.80769348144531 	 kl mean: 8.723892211914062 	 loss mean: 118.53158569335938
nll mean: 109.92454528808594 	 kl mean: 8.723892211914062 	 loss mean: 118.6484375
nll mean: 110.09913635253906 	 kl mean: 8.723892211914062 	 loss mean: 118.82302856445312
nll mean: 110.04423522949219 	 kl mean: 8.723892211914062 	 loss mean: 118.76812744140625



                                              
  0%|          | 0/38 [00:00<?, ?it/s].78it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.44it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].44it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].44it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].44it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.19it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.93it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.12335205078125 	 kl mean: 8.723892211914062 	 loss mean: 118.84725952148438
nll mean: 109.85230255126953 	 kl mean: 8.723892211914062 	 loss mean: 118.57620239257812
nll mean: 110.24195098876953 	 kl mean: 8.723892211914062 	 loss mean: 118.96583557128906
nll mean: 109.50312805175781 	 kl mean: 8.723892211914062 	 loss mean: 118.22700500488281
nll mean: 109.95880889892578 	 kl mean: 8.723892211914062 	 loss mean: 118.68270111083984



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 20%|██        | 2/10 [00:00<00:00, 14.18it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A

nll mean: 127.24237823486328 	 kl mean: 8.589604377746582 	 loss mean: 135.83200073242188
nll mean: 127.41209411621094 	 kl mean: 8.589604377746582 	 loss mean: 136.001708984375
nll mean: 127.29177856445312 	 kl mean: 8.589604377746582 	 loss mean: 135.8813934326172



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.01it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.05it/s][A

nll mean: 127.37117767333984 	 kl mean: 8.589604377746582 	 loss mean: 135.96078491210938
nll mean: 127.44345092773438 	 kl mean: 8.589604377746582 	 loss mean: 136.03305053710938
nll mean: 126.7747573852539 	 kl mean: 8.589604377746582 	 loss mean: 135.36436462402344



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.08it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s][A

nll mean: 127.14385223388672 	 kl mean: 8.589604377746582 	 loss mean: 135.73345947265625
nll mean: 127.23027801513672 	 kl mean: 8.589604377746582 	 loss mean: 135.81988525390625
nll mean: 127.01399230957031 	 kl mean: 8.589604377746582 	 loss mean: 135.6035919189453



                                              
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.04it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.97it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A

nll mean: 127.346923828125 	 kl mean: 8.589604377746582 	 loss mean: 135.9365234375
nll mean: 98.43821716308594 	 kl mean: 8.139363288879395 	 loss mean: 106.57758331298828
nll mean: 98.28024291992188 	 kl mean: 8.139363288879395 	 loss mean: 106.41960906982422
nll mean: 99.22089385986328 	 kl mean: 8.139363288879395 	 loss mean: 107.36026000976562
nll mean: 99.10404968261719 	 kl mean: 8.139363288879395 	 loss mean: 107.243408203125



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.91it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.81it/s][A

nll mean: 98.13970947265625 	 kl mean: 8.139363288879395 	 loss mean: 106.27906799316406
nll mean: 98.2005615234375 	 kl mean: 8.139363288879395 	 loss mean: 106.33992004394531
nll mean: 98.74942779541016 	 kl mean: 8.139363288879395 	 loss mean: 106.8887939453125
nll mean: 98.72210693359375 	 kl mean: 8.139363288879395 	 loss mean: 106.86146545410156
nll mean: 98.52802276611328 	 kl mean: 8.139363288879395 	 loss mean: 106.6673812866211



                                              
100%|██████████| 10/10 [00:00<00:00, 24.71it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
 20%|██        | 2/10 [00:00<00:00, 10.76it/s][A

nll mean: 98.06254577636719 	 kl mean: 8.139363288879395 	 loss mean: 106.20191192626953
nll mean: 137.559326171875 	 kl mean: 8.19878101348877 	 loss mean: 145.7581024169922
nll mean: 137.82293701171875 	 kl mean: 8.19878101348877 	 loss mean: 146.02171325683594



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.81it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s][A

nll mean: 138.1260986328125 	 kl mean: 8.19878101348877 	 loss mean: 146.32485961914062
nll mean: 137.358154296875 	 kl mean: 8.19878101348877 	 loss mean: 145.5569305419922
nll mean: 137.85940551757812 	 kl mean: 8.19878101348877 	 loss mean: 146.0581817626953



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.85it/s][A

nll mean: 138.05496215820312 	 kl mean: 8.19878101348877 	 loss mean: 146.2537384033203
nll mean: 138.10076904296875 	 kl mean: 8.19878101348877 	 loss mean: 146.299560546875
nll mean: 138.16903686523438 	 kl mean: 8.19878101348877 	 loss mean: 146.36781311035156



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.84it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]

nll mean: 138.14231872558594 	 kl mean: 8.19878101348877 	 loss mean: 146.3411102294922
nll mean: 138.05953979492188 	 kl mean: 8.19878101348877 	 loss mean: 146.25830078125
nll mean: 125.28761291503906 	 kl mean: 7.890483856201172 	 loss mean: 133.1781005859375



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 13.85it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.88it/s][A

nll mean: 124.84043884277344 	 kl mean: 7.890483856201172 	 loss mean: 132.73092651367188
nll mean: 125.26112365722656 	 kl mean: 7.890483856201172 	 loss mean: 133.151611328125
nll mean: 125.1878662109375 	 kl mean: 7.890483856201172 	 loss mean: 133.07835388183594



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.85it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A

nll mean: 125.60337829589844 	 kl mean: 7.890483856201172 	 loss mean: 133.49386596679688
nll mean: 125.54559326171875 	 kl mean: 7.890483856201172 	 loss mean: 133.4360809326172
nll mean: 124.73477172851562 	 kl mean: 7.890483856201172 	 loss mean: 132.625244140625



                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.93it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.98it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.55744171142578 	 kl mean: 7.890483856201172 	 loss mean: 133.4479217529297
nll mean: 125.61445617675781 	 kl mean: 7.890483856201172 	 loss mean: 133.50494384765625
nll mean: 125.3216781616211 	 kl mean: 7.890483856201172 	 loss mean: 133.21217346191406



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.07it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.94866943359375 	 kl mean: 7.806136131286621 	 loss mean: 131.7548065185547
nll mean: 123.48660278320312 	 kl mean: 7.806136131286621 	 loss mean: 131.29273986816406
nll mean: 123.5419921875 	 kl mean: 7.806136131286621 	 loss mean: 131.34812927246094



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.14it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.09it/s][A

nll mean: 123.41470336914062 	 kl mean: 7.806136131286621 	 loss mean: 131.22084045410156
nll mean: 123.3435287475586 	 kl mean: 7.806136131286621 	 loss mean: 131.149658203125
nll mean: 123.55506134033203 	 kl mean: 7.806136131286621 	 loss mean: 131.36119079589844



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.14it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.58395385742188 	 kl mean: 7.806136131286621 	 loss mean: 131.39007568359375
nll mean: 123.63218688964844 	 kl mean: 7.806136131286621 	 loss mean: 131.43832397460938
nll mean: 123.87872314453125 	 kl mean: 7.806136131286621 	 loss mean: 131.68487548828125



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.14it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.57it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 123.75247192382812 	 kl mean: 7.806136131286621 	 loss mean: 131.55860900878906
nll mean: 132.9710693359375 	 kl mean: 7.966771125793457 	 loss mean: 140.93783569335938
nll mean: 132.59446716308594 	 kl mean: 7.966771125793457 	 loss mean: 140.5612335205078
nll mean: 132.76002502441406 	 kl mean: 7.966771125793457 	 loss mean: 140.726806640625
nll mean: 132.8791046142578 	 kl mean: 7.966771125793457 	 loss mean: 140.84588623046875



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.31it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.16it/s][A
                                              

nll mean: 132.7381591796875 	 kl mean: 7.966771125793457 	 loss mean: 140.70492553710938
nll mean: 132.89431762695312 	 kl mean: 7.966771125793457 	 loss mean: 140.861083984375
nll mean: 132.90811157226562 	 kl mean: 7.966771125793457 	 loss mean: 140.87490844726562
nll mean: 132.54122924804688 	 kl mean: 7.966771125793457 	 loss mean: 140.5080108642578
nll mean: 132.92724609375 	 kl mean: 7.966771125793457 	 loss mean: 140.89401245117188


                                              
100%|██████████| 10/10 [00:00<00:00, 24.99it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.85it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A

nll mean: 132.94296264648438 	 kl mean: 7.966771125793457 	 loss mean: 140.90972900390625
nll mean: 106.41959381103516 	 kl mean: 7.816275596618652 	 loss mean: 114.23587036132812
nll mean: 106.51638793945312 	 kl mean: 7.816275596618652 	 loss mean: 114.3326644897461
nll mean: 106.34005737304688 	 kl mean: 7.816275596618652 	 loss mean: 114.15632629394531
nll mean: 105.88134765625 	 kl mean: 7.816275596618652 	 loss mean: 113.69762420654297



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.73it/s][A

nll mean: 106.35221862792969 	 kl mean: 7.816275596618652 	 loss mean: 114.16848754882812
nll mean: 105.83154296875 	 kl mean: 7.816275596618652 	 loss mean: 113.64781188964844
nll mean: 105.88957214355469 	 kl mean: 7.816275596618652 	 loss mean: 113.70584106445312
nll mean: 105.70478820800781 	 kl mean: 7.816275596618652 	 loss mean: 113.52107238769531
nll mean: 105.92848205566406 	 kl mean: 7.816275596618652 	 loss mean: 113.7447509765625



                                              
100%|██████████| 10/10 [00:00<00:00, 24.68it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.65it/s][A

nll mean: 107.11752319335938 	 kl mean: 7.816275596618652 	 loss mean: 114.93380737304688
nll mean: 132.47508239746094 	 kl mean: 8.461917877197266 	 loss mean: 140.93699645996094
nll mean: 131.9254150390625 	 kl mean: 8.461917877197266 	 loss mean: 140.3873291015625



                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.90it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.12it/s][A

nll mean: 132.5439910888672 	 kl mean: 8.461917877197266 	 loss mean: 141.0059051513672
nll mean: 132.44393920898438 	 kl mean: 8.461917877197266 	 loss mean: 140.90585327148438
nll mean: 132.01312255859375 	 kl mean: 8.461917877197266 	 loss mean: 140.4750518798828
nll mean: 133.01449584960938 	 kl mean: 8.461917877197266 	 loss mean: 141.47640991210938



                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 15.07it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.21it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]


nll mean: 131.95736694335938 	 kl mean: 8.461917877197266 	 loss mean: 140.41928100585938
nll mean: 132.67019653320312 	 kl mean: 8.461917877197266 	 loss mean: 141.1321258544922
nll mean: 131.74130249023438 	 kl mean: 8.461917877197266 	 loss mean: 140.20321655273438
nll mean: 132.21630859375 	 kl mean: 8.461917877197266 	 loss mean: 140.67822265625


  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s]
 30%|███       | 3/10 [00:00<00:00, 20.52it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A

nll mean: 131.2265625 	 kl mean: 8.148530960083008 	 loss mean: 139.37509155273438
nll mean: 131.1649932861328 	 kl mean: 8.148530960083008 	 loss mean: 139.3135223388672
nll mean: 130.74884033203125 	 kl mean: 8.148530960083008 	 loss mean: 138.89736938476562
nll mean: 131.19012451171875 	 kl mean: 8.148530960083008 	 loss mean: 139.33865356445312
nll mean: 131.2128143310547 	 kl mean: 8.148530960083008 	 loss mean: 139.36135864257812



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 20.53it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 20.79it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 20.82it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.93319702148438 	 kl mean: 8.148530960083008 	 loss mean: 139.08172607421875
nll mean: 131.34158325195312 	 kl mean: 8.148530960083008 	 loss mean: 139.49014282226562
nll mean: 131.32257080078125 	 kl mean: 8.148530960083008 	 loss mean: 139.47109985351562
nll mean: 130.82249450683594 	 kl mean: 8.148530960083008 	 loss mean: 138.9710235595703
nll mean: 131.5801239013672 	 kl mean: 8.148530960083008 	 loss mean: 139.7286376953125



                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 25.07it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 25.07it/s]

nll mean: 118.67205810546875 	 kl mean: 8.124723434448242 	 loss mean: 126.7967758178711
nll mean: 118.58772277832031 	 kl mean: 8.124723434448242 	 loss mean: 126.71243286132812
nll mean: 118.59002685546875 	 kl mean: 8.124723434448242 	 loss mean: 126.71475219726562
nll mean: 118.68394470214844 	 kl mean: 8.124723434448242 	 loss mean: 126.80867004394531
nll mean: 118.56492614746094 	 kl mean: 8.124723434448242 	 loss mean: 126.68965911865234
nll mean: 118.89590454101562 	 kl mean: 8.124723434448242 	 loss mean: 127.0206298828125


 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.99it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.91it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.83it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]

nll mean: 119.34248352050781 	 kl mean: 8.124723434448242 	 loss mean: 127.46720886230469
nll mean: 118.71015167236328 	 kl mean: 8.124723434448242 	 loss mean: 126.83486938476562
nll mean: 118.65362548828125 	 kl mean: 8.124723434448242 	 loss mean: 126.7783432006836
nll mean: 118.39605712890625 	 kl mean: 8.124723434448242 	 loss mean: 126.5207748413086
nll mean: 140.85255432128906 	 kl mean: 8.330364227294922 	 loss mean: 149.18292236328125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.51it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.48it/s][A

nll mean: 140.73629760742188 	 kl mean: 8.330364227294922 	 loss mean: 149.066650390625
nll mean: 141.44729614257812 	 kl mean: 8.330364227294922 	 loss mean: 149.7776641845703
nll mean: 140.88409423828125 	 kl mean: 8.330364227294922 	 loss mean: 149.21444702148438
nll mean: 140.82888793945312 	 kl mean: 8.330364227294922 	 loss mean: 149.15924072265625
nll mean: 140.96678161621094 	 kl mean: 8.330364227294922 	 loss mean: 149.29714965820312



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.40it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.30it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 141.165771484375 	 kl mean: 8.330364227294922 	 loss mean: 149.4961395263672
nll mean: 141.32168579101562 	 kl mean: 8.330364227294922 	 loss mean: 149.65206909179688
nll mean: 141.0836944580078 	 kl mean: 8.330364227294922 	 loss mean: 149.4140625
nll mean: 141.57354736328125 	 kl mean: 8.330364227294922 	 loss mean: 149.90391540527344



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
 20%|██        | 2/10 [00:00<00:00, 12.50it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s][A

nll mean: 120.35603332519531 	 kl mean: 8.148321151733398 	 loss mean: 128.50436401367188
nll mean: 120.32205963134766 	 kl mean: 8.148321151733398 	 loss mean: 128.4703826904297
nll mean: 119.474365234375 	 kl mean: 8.148321151733398 	 loss mean: 127.6226806640625



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.62it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.55it/s][A

nll mean: 119.59822082519531 	 kl mean: 8.148321151733398 	 loss mean: 127.74654388427734
nll mean: 119.79136657714844 	 kl mean: 8.148321151733398 	 loss mean: 127.93968963623047
nll mean: 120.02328491210938 	 kl mean: 8.148321151733398 	 loss mean: 128.17161560058594



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.55it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A

nll mean: 120.281982421875 	 kl mean: 8.148321151733398 	 loss mean: 128.4302978515625
nll mean: 120.47427368164062 	 kl mean: 8.148321151733398 	 loss mean: 128.6226043701172
nll mean: 120.38395690917969 	 kl mean: 8.148321151733398 	 loss mean: 128.53228759765625



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.58it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 10%|█         | 1/10 [00:00<00:00,  9.79it/s][A

nll mean: 119.8790283203125 	 kl mean: 8.148321151733398 	 loss mean: 128.02734375
nll mean: 159.5039825439453 	 kl mean: 9.150245666503906 	 loss mean: 168.6542205810547



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.79it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.82it/s][A


nll mean: 159.12411499023438 	 kl mean: 9.150245666503906 	 loss mean: 168.27435302734375
nll mean: 158.89666748046875 	 kl mean: 9.150245666503906 	 loss mean: 168.04690551757812


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.86it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.90it/s][A
                                              

nll mean: 159.21896362304688 	 kl mean: 9.150245666503906 	 loss mean: 168.36920166015625
nll mean: 158.90379333496094 	 kl mean: 9.150245666503906 	 loss mean: 168.05404663085938


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.89it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.90it/s][A
[A                                           

nll mean: 159.33026123046875 	 kl mean: 9.150245666503906 	 loss mean: 168.48052978515625
nll mean: 158.78892517089844 	 kl mean: 9.150245666503906 	 loss mean: 167.93917846679688


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.90it/s][A

nll mean: 159.76483154296875 	 kl mean: 9.150245666503906 	 loss mean: 168.91510009765625
nll mean: 158.931396484375 	 kl mean: 9.150245666503906 	 loss mean: 168.08163452148438



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.89it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.00it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 159.57232666015625 	 kl mean: 9.150245666503906 	 loss mean: 168.72256469726562
nll mean: 134.75509643554688 	 kl mean: 8.019814491271973 	 loss mean: 142.77493286132812
nll mean: 135.21807861328125 	 kl mean: 8.019814491271973 	 loss mean: 143.23788452148438
nll mean: 134.72152709960938 	 kl mean: 8.019814491271973 	 loss mean: 142.7413330078125



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 17.90it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 17.91it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 134.57713317871094 	 kl mean: 8.019814491271973 	 loss mean: 142.59695434570312
nll mean: 134.03009033203125 	 kl mean: 8.019814491271973 	 loss mean: 142.04991149902344
nll mean: 134.5906982421875 	 kl mean: 8.019814491271973 	 loss mean: 142.61050415039062
nll mean: 134.31764221191406 	 kl mean: 8.019814491271973 	 loss mean: 142.33746337890625



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 17.85it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.82it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 134.2737274169922 	 kl mean: 8.019814491271973 	 loss mean: 142.2935333251953
nll mean: 134.58163452148438 	 kl mean: 8.019814491271973 	 loss mean: 142.6014404296875
nll mean: 134.718994140625 	 kl mean: 8.019814491271973 	 loss mean: 142.73880004882812


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A

nll mean: 143.41595458984375 	 kl mean: 8.300817489624023 	 loss mean: 151.71676635742188
nll mean: 143.36715698242188 	 kl mean: 8.300817489624023 	 loss mean: 151.66796875
nll mean: 144.163330078125 	 kl mean: 8.300817489624023 	 loss mean: 152.46414184570312


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.78it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.75it/s][A

nll mean: 143.70416259765625 	 kl mean: 8.300817489624023 	 loss mean: 152.00497436523438
nll mean: 143.40121459960938 	 kl mean: 8.300817489624023 	 loss mean: 151.7020263671875
nll mean: 143.07138061523438 	 kl mean: 8.300817489624023 	 loss mean: 151.37220764160156


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.75it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A

nll mean: 142.781005859375 	 kl mean: 8.300817489624023 	 loss mean: 151.0818328857422
nll mean: 143.113037109375 	 kl mean: 8.300817489624023 	 loss mean: 151.41384887695312
nll mean: 143.46298217773438 	 kl mean: 8.300817489624023 	 loss mean: 151.7637939453125


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.63it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 23.89it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A

nll mean: 144.02821350097656 	 kl mean: 8.300817489624023 	 loss mean: 152.3290252685547
nll mean: 142.75856018066406 	 kl mean: 8.141156196594238 	 loss mean: 150.89971923828125
nll mean: 143.1020965576172 	 kl mean: 8.141156196594238 	 loss mean: 151.2432403564453
nll mean: 142.69873046875 	 kl mean: 8.141156196594238 	 loss mean: 150.8398895263672
nll mean: 143.32070922851562 	 kl mean: 8.141156196594238 	 loss mean: 151.46185302734375



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 23.68it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 23.64it/s][A

nll mean: 142.60523986816406 	 kl mean: 8.141156196594238 	 loss mean: 150.74639892578125
nll mean: 143.32867431640625 	 kl mean: 8.141156196594238 	 loss mean: 151.46983337402344
nll mean: 143.17164611816406 	 kl mean: 8.141156196594238 	 loss mean: 151.3127899169922
nll mean: 142.7604522705078 	 kl mean: 8.141156196594238 	 loss mean: 150.90159606933594
nll mean: 142.84848022460938 	 kl mean: 8.141156196594238 	 loss mean: 150.9896240234375



                                               
100%|██████████| 10/10 [00:00<00:00, 23.63it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 24.67it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A

nll mean: 143.43870544433594 	 kl mean: 8.141156196594238 	 loss mean: 151.57986450195312
nll mean: 133.55453491210938 	 kl mean: 8.221771240234375 	 loss mean: 141.77630615234375
nll mean: 133.55484008789062 	 kl mean: 8.221771240234375 	 loss mean: 141.77662658691406
nll mean: 134.45265197753906 	 kl mean: 8.221771240234375 	 loss mean: 142.6744384765625
nll mean: 134.1062469482422 	 kl mean: 8.221771240234375 	 loss mean: 142.32803344726562



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.38it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.15it/s][A

nll mean: 134.21621704101562 	 kl mean: 8.221771240234375 	 loss mean: 142.43798828125
nll mean: 134.16854858398438 	 kl mean: 8.221771240234375 	 loss mean: 142.39031982421875
nll mean: 133.8347625732422 	 kl mean: 8.221771240234375 	 loss mean: 142.0565185546875
nll mean: 134.1802520751953 	 kl mean: 8.221771240234375 	 loss mean: 142.4020233154297
nll mean: 134.305419921875 	 kl mean: 8.221771240234375 	 loss mean: 142.52719116210938



                                               
100%|██████████| 10/10 [00:00<00:00, 23.93it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.71it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.71it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.50it/s][A

nll mean: 134.12355041503906 	 kl mean: 8.221771240234375 	 loss mean: 142.34532165527344
nll mean: 130.16201782226562 	 kl mean: 8.721571922302246 	 loss mean: 138.88360595703125
nll mean: 130.22525024414062 	 kl mean: 8.721571922302246 	 loss mean: 138.9468231201172


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 12.50it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A

nll mean: 129.605224609375 	 kl mean: 8.721571922302246 	 loss mean: 138.3267822265625
nll mean: 129.76266479492188 	 kl mean: 8.721571922302246 	 loss mean: 138.48422241210938
nll mean: 129.64776611328125 	 kl mean: 8.721571922302246 	 loss mean: 138.36932373046875


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.40it/s][A

nll mean: 130.47509765625 	 kl mean: 8.721571922302246 	 loss mean: 139.1966552734375
nll mean: 129.9452667236328 	 kl mean: 8.721571922302246 	 loss mean: 138.66683959960938
nll mean: 129.67156982421875 	 kl mean: 8.721571922302246 	 loss mean: 138.39315795898438


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.40it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]

nll mean: 129.75128173828125 	 kl mean: 8.721571922302246 	 loss mean: 138.47286987304688
nll mean: 129.72784423828125 	 kl mean: 8.721571922302246 	 loss mean: 138.4494171142578
nll mean: 147.1883087158203 	 kl mean: 8.465097427368164 	 loss mean: 155.65341186523438



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 12.63it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A

nll mean: 147.80291748046875 	 kl mean: 8.465097427368164 	 loss mean: 156.26800537109375
nll mean: 147.69970703125 	 kl mean: 8.465097427368164 	 loss mean: 156.16482543945312
nll mean: 147.6531219482422 	 kl mean: 8.465097427368164 	 loss mean: 156.1182098388672



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.48it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A

nll mean: 147.96690368652344 	 kl mean: 8.465097427368164 	 loss mean: 156.43199157714844
nll mean: 147.42227172851562 	 kl mean: 8.465097427368164 	 loss mean: 155.88739013671875
nll mean: 147.5616455078125 	 kl mean: 8.465097427368164 	 loss mean: 156.02674865722656



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.49it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.38it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 147.25331115722656 	 kl mean: 8.465097427368164 	 loss mean: 155.71839904785156
nll mean: 148.02542114257812 	 kl mean: 8.465097427368164 	 loss mean: 156.49050903320312
nll mean: 147.77671813964844 	 kl mean: 8.465097427368164 	 loss mean: 156.24180603027344



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s]
 20%|██        | 2/10 [00:00<00:00, 12.66it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s][A

nll mean: 156.11083984375 	 kl mean: 8.16487979888916 	 loss mean: 164.27572631835938
nll mean: 156.63958740234375 	 kl mean: 8.16487979888916 	 loss mean: 164.80445861816406
nll mean: 156.9061737060547 	 kl mean: 8.16487979888916 	 loss mean: 165.07106018066406



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.54it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A

nll mean: 156.5649871826172 	 kl mean: 8.16487979888916 	 loss mean: 164.7298583984375
nll mean: 157.43994140625 	 kl mean: 8.16487979888916 	 loss mean: 165.60482788085938
nll mean: 156.2291717529297 	 kl mean: 8.16487979888916 	 loss mean: 164.39405822753906



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.43it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.43it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.43it/s][A

nll mean: 155.82118225097656 	 kl mean: 8.16487979888916 	 loss mean: 163.98605346679688
nll mean: 156.972412109375 	 kl mean: 8.16487979888916 	 loss mean: 165.13729858398438
nll mean: 157.10446166992188 	 kl mean: 8.16487979888916 	 loss mean: 165.26934814453125



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]


nll mean: 156.60597229003906 	 kl mean: 8.16487979888916 	 loss mean: 164.77084350585938
nll mean: 117.55096435546875 	 kl mean: 8.389556884765625 	 loss mean: 125.94051361083984


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 10.08it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.01it/s][A
                                              

nll mean: 117.59611511230469 	 kl mean: 8.389556884765625 	 loss mean: 125.98566436767578
nll mean: 117.50475311279297 	 kl mean: 8.389556884765625 	 loss mean: 125.89430236816406


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.00it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.97it/s][A
                                               

nll mean: 117.13208770751953 	 kl mean: 8.389556884765625 	 loss mean: 125.52165222167969
nll mean: 117.21112060546875 	 kl mean: 8.389556884765625 	 loss mean: 125.60067749023438



 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.02it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A

nll mean: 117.46868133544922 	 kl mean: 8.389556884765625 	 loss mean: 125.85824584960938
nll mean: 117.57647705078125 	 kl mean: 8.389556884765625 	 loss mean: 125.96601867675781
nll mean: 117.07936096191406 	 kl mean: 8.389556884765625 	 loss mean: 125.46891784667969



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.05it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 10.05it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s]

nll mean: 117.52896881103516 	 kl mean: 8.389556884765625 	 loss mean: 125.91853332519531
nll mean: 117.472412109375 	 kl mean: 8.389556884765625 	 loss mean: 125.86197662353516
nll mean: 106.66954040527344 	 kl mean: 7.435132026672363 	 loss mean: 114.10467529296875
nll mean: 106.4617691040039 	 kl mean: 7.435132026672363 	 loss mean: 113.89689636230469
nll mean: 106.5548095703125 	 kl mean: 7.435132026672363 	 loss mean: 113.98994445800781



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s]
 40%|████      | 4/10 [00:00<00:00, 33.15it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s][A
 80%|████████  | 8/10 [00:00<00:00, 33.09it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.23it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.91it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 106.52348327636719 	 kl mean: 7.435132026672363 	 loss mean: 113.9586181640625
nll mean: 106.34330749511719 	 kl mean: 7.435132026672363 	 loss mean: 113.7784423828125
nll mean: 106.84201049804688 	 kl mean: 7.435132026672363 	 loss mean: 114.27713012695312
nll mean: 106.31130981445312 	 kl mean: 7.435132026672363 	 loss mean: 113.74644470214844
nll mean: 105.65568542480469 	 kl mean: 7.435132026672363 	 loss mean: 113.09082794189453
nll mean: 106.74891662597656 	 kl mean: 7.435132026672363 	 loss mean: 114.18405151367188
nll mean: 106.16619873046875 	 kl mean: 7.435132026672363 	 loss mean: 113.60133361816406



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s]
 20%|██        | 2/10 [00:00<00:00, 14.69it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s][A

nll mean: 156.44967651367188 	 kl mean: 8.481588363647461 	 loss mean: 164.93125915527344
nll mean: 156.8223114013672 	 kl mean: 8.481588363647461 	 loss mean: 165.3039093017578
nll mean: 156.22315979003906 	 kl mean: 8.481588363647461 	 loss mean: 164.7047576904297



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.63it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.51it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.71it/s][A

nll mean: 155.79443359375 	 kl mean: 8.481588363647461 	 loss mean: 164.27603149414062
nll mean: 156.0535125732422 	 kl mean: 8.481588363647461 	 loss mean: 164.5351104736328
nll mean: 156.11175537109375 	 kl mean: 8.481588363647461 	 loss mean: 164.5933380126953



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.51it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.73it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.51it/s][A

nll mean: 156.0625 	 kl mean: 8.481588363647461 	 loss mean: 164.54409790039062
nll mean: 156.8448944091797 	 kl mean: 8.481588363647461 	 loss mean: 165.32647705078125
nll mean: 156.43748474121094 	 kl mean: 8.481588363647461 	 loss mean: 164.91908264160156



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.70it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 22.15it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A

nll mean: 156.18496704101562 	 kl mean: 8.481588363647461 	 loss mean: 164.6665496826172
nll mean: 119.71076202392578 	 kl mean: 8.97195053100586 	 loss mean: 128.68272399902344
nll mean: 119.46737670898438 	 kl mean: 8.97195053100586 	 loss mean: 128.4393310546875
nll mean: 119.74092102050781 	 kl mean: 8.97195053100586 	 loss mean: 128.71287536621094
nll mean: 120.03858947753906 	 kl mean: 8.97195053100586 	 loss mean: 129.01052856445312



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.94it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.77it/s][A

nll mean: 119.7779541015625 	 kl mean: 8.97195053100586 	 loss mean: 128.74990844726562
nll mean: 119.68639373779297 	 kl mean: 8.97195053100586 	 loss mean: 128.65834045410156
nll mean: 119.78663635253906 	 kl mean: 8.97195053100586 	 loss mean: 128.75857543945312
nll mean: 119.71583557128906 	 kl mean: 8.97195053100586 	 loss mean: 128.6877899169922
nll mean: 119.41404724121094 	 kl mean: 8.97195053100586 	 loss mean: 128.385986328125



                                               
100%|██████████| 10/10 [00:00<00:00, 21.48it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.62it/s][A

nll mean: 119.81599426269531 	 kl mean: 8.97195053100586 	 loss mean: 128.78793334960938
nll mean: 114.35356140136719 	 kl mean: 7.807682991027832 	 loss mean: 122.16123962402344
nll mean: 114.0194091796875 	 kl mean: 7.807682991027832 	 loss mean: 121.82708740234375



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A

nll mean: 114.51299285888672 	 kl mean: 7.807682991027832 	 loss mean: 122.3206787109375
nll mean: 114.15372467041016 	 kl mean: 7.807682991027832 	 loss mean: 121.96141052246094
nll mean: 113.68017578125 	 kl mean: 7.807682991027832 	 loss mean: 121.48786163330078



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.70it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.73it/s][A

nll mean: 113.82096099853516 	 kl mean: 7.807682991027832 	 loss mean: 121.62864685058594
nll mean: 114.16252899169922 	 kl mean: 7.807682991027832 	 loss mean: 121.97020721435547
nll mean: 113.6064453125 	 kl mean: 7.807682991027832 	 loss mean: 121.41412353515625



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.76it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]

nll mean: 113.87374877929688 	 kl mean: 7.807682991027832 	 loss mean: 121.68142700195312
nll mean: 114.03147888183594 	 kl mean: 7.807682991027832 	 loss mean: 121.83915710449219
nll mean: 82.22162628173828 	 kl mean: 7.792766571044922 	 loss mean: 90.01439666748047
nll mean: 81.55772399902344 	 kl mean: 7.792766571044922 	 loss mean: 89.3504867553711



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.29it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.50it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 81.94904327392578 	 kl mean: 7.792766571044922 	 loss mean: 89.7418212890625
nll mean: 81.47286224365234 	 kl mean: 7.792766571044922 	 loss mean: 89.265625
nll mean: 81.66940307617188 	 kl mean: 7.792766571044922 	 loss mean: 89.46216583251953
nll mean: 81.62844848632812 	 kl mean: 7.792766571044922 	 loss mean: 89.42121887207031
nll mean: 81.48213958740234 	 kl mean: 7.792766571044922 	 loss mean: 89.27490234375



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.74it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.93it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]

nll mean: 81.62699127197266 	 kl mean: 7.792766571044922 	 loss mean: 89.41976165771484
nll mean: 81.89134216308594 	 kl mean: 7.792766571044922 	 loss mean: 89.68411254882812
nll mean: 81.9256591796875 	 kl mean: 7.792766571044922 	 loss mean: 89.71842956542969
nll mean: 108.40034484863281 	 kl mean: 8.099299430847168 	 loss mean: 116.49964904785156
nll mean: 108.38043212890625 	 kl mean: 8.099299430847168 	 loss mean: 116.479736328125



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.84it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.83it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A

nll mean: 109.26569366455078 	 kl mean: 8.099299430847168 	 loss mean: 117.364990234375
nll mean: 108.7674331665039 	 kl mean: 8.099299430847168 	 loss mean: 116.86672973632812
nll mean: 108.86984252929688 	 kl mean: 8.099299430847168 	 loss mean: 116.96914672851562
nll mean: 108.76264190673828 	 kl mean: 8.099299430847168 	 loss mean: 116.8619384765625
nll mean: 108.09693908691406 	 kl mean: 8.099299430847168 	 loss mean: 116.19624328613281



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.90it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.86it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]

nll mean: 108.38932800292969 	 kl mean: 8.099299430847168 	 loss mean: 116.48863220214844
nll mean: 108.47962951660156 	 kl mean: 8.099299430847168 	 loss mean: 116.57893371582031
nll mean: 108.7413101196289 	 kl mean: 8.099299430847168 	 loss mean: 116.84062194824219
nll mean: 121.26044464111328 	 kl mean: 8.292230606079102 	 loss mean: 129.55267333984375



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.35it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.41it/s][A

nll mean: 121.08564758300781 	 kl mean: 8.292230606079102 	 loss mean: 129.37786865234375
nll mean: 121.49658966064453 	 kl mean: 8.292230606079102 	 loss mean: 129.788818359375
nll mean: 121.22872924804688 	 kl mean: 8.292230606079102 	 loss mean: 129.52096557617188



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 121.61955261230469 	 kl mean: 8.292230606079102 	 loss mean: 129.91177368164062
nll mean: 121.55934143066406 	 kl mean: 8.292230606079102 	 loss mean: 129.8515625
nll mean: 121.70130920410156 	 kl mean: 8.292230606079102 	 loss mean: 129.99354553222656



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.51it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.49it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.52679443359375 	 kl mean: 8.292230606079102 	 loss mean: 129.8190155029297
nll mean: 121.60061645507812 	 kl mean: 8.292230606079102 	 loss mean: 129.89285278320312
nll mean: 121.16522979736328 	 kl mean: 8.292230606079102 	 loss mean: 129.45745849609375



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 10%|█         | 1/10 [00:00<00:00,  9.87it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
                                               
 10%|█         | 1/10 [00:00<00:00,  9.87it/s][A

nll mean: 61.82196807861328 	 kl mean: 8.595566749572754 	 loss mean: 70.41753387451172
nll mean: 61.69194793701172 	 kl mean: 8.595566749572754 	 loss mean: 70.28751373291016
nll mean: 62.20570373535156 	 kl mean: 8.595566749572754 	 loss mean: 70.80126953125


 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 30%|███       | 3/10 [00:00<00:00,  9.92it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.90it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.90it/s][A


nll mean: 61.384803771972656 	 kl mean: 8.595566749572754 	 loss mean: 69.9803695678711
nll mean: 62.18488693237305 	 kl mean: 8.595566749572754 	 loss mean: 70.78045654296875


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.88it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.89it/s][A


nll mean: 61.94266891479492 	 kl mean: 8.595566749572754 	 loss mean: 70.53823852539062
nll mean: 62.290950775146484 	 kl mean: 8.595566749572754 	 loss mean: 70.88652038574219


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.88it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.88it/s][A

nll mean: 61.832252502441406 	 kl mean: 8.595566749572754 	 loss mean: 70.42781829833984
nll mean: 61.77894973754883 	 kl mean: 8.595566749572754 	 loss mean: 70.37451171875



                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.88it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A

nll mean: 61.91265869140625 	 kl mean: 8.595566749572754 	 loss mean: 70.50822448730469
nll mean: 105.65850830078125 	 kl mean: 8.126787185668945 	 loss mean: 113.78529357910156
nll mean: 105.22845458984375 	 kl mean: 8.126787185668945 	 loss mean: 113.35523223876953


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.68it/s][A

nll mean: 105.40792846679688 	 kl mean: 8.126787185668945 	 loss mean: 113.53472137451172
nll mean: 105.205810546875 	 kl mean: 8.126787185668945 	 loss mean: 113.33261108398438
nll mean: 105.04230499267578 	 kl mean: 8.126787185668945 	 loss mean: 113.16908264160156


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.68it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A

nll mean: 105.08944702148438 	 kl mean: 8.126787185668945 	 loss mean: 113.21623992919922
nll mean: 105.1138916015625 	 kl mean: 8.126787185668945 	 loss mean: 113.24068450927734
nll mean: 105.70335388183594 	 kl mean: 8.126787185668945 	 loss mean: 113.83013153076172


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.32it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.75it/s][A

nll mean: 105.11683654785156 	 kl mean: 8.126787185668945 	 loss mean: 113.24362182617188
nll mean: 104.93414306640625 	 kl mean: 8.126787185668945 	 loss mean: 113.06092071533203
nll mean: 137.44943237304688 	 kl mean: 8.899723052978516 	 loss mean: 146.34915161132812


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 10%|█         | 1/10 [00:00<00:00,  9.75it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00,  9.76it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.82it/s][A

nll mean: 137.0643310546875 	 kl mean: 8.899723052978516 	 loss mean: 145.96405029296875
nll mean: 137.7585906982422 	 kl mean: 8.899723052978516 	 loss mean: 146.6583251953125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00,  9.82it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 40%|████      | 4/10 [00:00<00:00,  9.84it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.82it/s][A

nll mean: 137.15335083007812 	 kl mean: 8.899723052978516 	 loss mean: 146.05307006835938
nll mean: 137.7014617919922 	 kl mean: 8.899723052978516 	 loss mean: 146.60118103027344


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.82it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.86it/s][A

nll mean: 137.76358032226562 	 kl mean: 8.899723052978516 	 loss mean: 146.66329956054688
nll mean: 137.0815887451172 	 kl mean: 8.899723052978516 	 loss mean: 145.98130798339844


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.86it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.89it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.87it/s][A

nll mean: 138.16375732421875 	 kl mean: 8.899723052978516 	 loss mean: 147.0634765625
nll mean: 136.9967041015625 	 kl mean: 8.899723052978516 	 loss mean: 145.8964385986328


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.87it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.84it/s][A
 84%|████████▍ | 32/38 [00:20<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
 30%|███       | 3/10 [00:00<00:00, 24.95it/s][A

nll mean: 138.10665893554688 	 kl mean: 8.899723052978516 	 loss mean: 147.00637817382812
nll mean: 65.22412109375 	 kl mean: 7.549360275268555 	 loss mean: 72.77348327636719
nll mean: 64.59063720703125 	 kl mean: 7.549360275268555 	 loss mean: 72.13999938964844
nll mean: 64.26605987548828 	 kl mean: 7.549360275268555 	 loss mean: 71.81542205810547
nll mean: 64.11370849609375 	 kl mean: 7.549360275268555 	 loss mean: 71.66307067871094


                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
 30%|███       | 3/10 [00:00<00:00, 24.95it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.75it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.60it/s][A

nll mean: 64.39350128173828 	 kl mean: 7.549360275268555 	 loss mean: 71.94285583496094
nll mean: 64.7524185180664 	 kl mean: 7.549360275268555 	 loss mean: 72.3017807006836
nll mean: 64.05459594726562 	 kl mean: 7.549360275268555 	 loss mean: 71.60395812988281
nll mean: 64.69367218017578 	 kl mean: 7.549360275268555 	 loss mean: 72.24302673339844
nll mean: 64.17796325683594 	 kl mean: 7.549360275268555 	 loss mean: 71.7273178100586


                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
100%|██████████| 10/10 [00:00<00:00, 24.42it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s]
 30%|███       | 3/10 [00:00<00:00, 21.49it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A

nll mean: 64.26854705810547 	 kl mean: 7.549360275268555 	 loss mean: 71.81790924072266
nll mean: 117.96626281738281 	 kl mean: 7.9364800453186035 	 loss mean: 125.90274047851562
nll mean: 118.39134216308594 	 kl mean: 7.9364800453186035 	 loss mean: 126.32781982421875
nll mean: 118.25416564941406 	 kl mean: 7.9364800453186035 	 loss mean: 126.19064331054688
nll mean: 117.64432525634766 	 kl mean: 7.9364800453186035 	 loss mean: 125.580810546875



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.44it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.41it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.39it/s][A

nll mean: 117.11048889160156 	 kl mean: 7.9364800453186035 	 loss mean: 125.0469741821289
nll mean: 117.35755920410156 	 kl mean: 7.9364800453186035 	 loss mean: 125.2940444946289
nll mean: 117.4644775390625 	 kl mean: 7.9364800453186035 	 loss mean: 125.40095520019531
nll mean: 117.57698059082031 	 kl mean: 7.9364800453186035 	 loss mean: 125.51345825195312
nll mean: 118.08432006835938 	 kl mean: 7.9364800453186035 	 loss mean: 126.02081298828125



                                               
100%|██████████| 10/10 [00:00<00:00, 21.33it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.57it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.57it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.48it/s][A

nll mean: 117.98111724853516 	 kl mean: 7.9364800453186035 	 loss mean: 125.91758728027344
nll mean: 119.80219268798828 	 kl mean: 8.429821014404297 	 loss mean: 128.23202514648438
nll mean: 119.70445251464844 	 kl mean: 8.429821014404297 	 loss mean: 128.13427734375


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.48it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.48it/s][A

nll mean: 119.88495635986328 	 kl mean: 8.429821014404297 	 loss mean: 128.3147735595703
nll mean: 119.91922760009766 	 kl mean: 8.429821014404297 	 loss mean: 128.3490447998047
nll mean: 119.86844635009766 	 kl mean: 8.429821014404297 	 loss mean: 128.29827880859375


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 12.48it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.55it/s][A

nll mean: 119.57149505615234 	 kl mean: 8.429821014404297 	 loss mean: 128.00131225585938
nll mean: 118.86451721191406 	 kl mean: 8.429821014404297 	 loss mean: 127.2943344116211
nll mean: 119.81834411621094 	 kl mean: 8.429821014404297 	 loss mean: 128.2481689453125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.58it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]

nll mean: 119.39707946777344 	 kl mean: 8.429821014404297 	 loss mean: 127.826904296875
nll mean: 119.54864501953125 	 kl mean: 8.429821014404297 	 loss mean: 127.97846221923828
nll mean: 112.95330810546875 	 kl mean: 8.09145736694336 	 loss mean: 121.04476165771484



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.60it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.62it/s][A

nll mean: 112.58529663085938 	 kl mean: 8.09145736694336 	 loss mean: 120.6767578125
nll mean: 112.42642211914062 	 kl mean: 8.09145736694336 	 loss mean: 120.51788330078125
nll mean: 112.92855834960938 	 kl mean: 8.09145736694336 	 loss mean: 121.02001953125



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.64it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A

nll mean: 112.63465881347656 	 kl mean: 8.09145736694336 	 loss mean: 120.72611999511719
nll mean: 112.62867736816406 	 kl mean: 8.09145736694336 	 loss mean: 120.72013092041016
nll mean: 112.34477233886719 	 kl mean: 8.09145736694336 	 loss mean: 120.43621826171875



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.60it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.80260467529297 	 kl mean: 8.09145736694336 	 loss mean: 120.89405822753906
nll mean: 112.81804656982422 	 kl mean: 8.09145736694336 	 loss mean: 120.90950012207031
nll mean: 112.62669372558594 	 kl mean: 8.09145736694336 	 loss mean: 120.71815490722656



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 23.47it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A

nll mean: 110.98330688476562 	 kl mean: 8.196907997131348 	 loss mean: 119.18021392822266
nll mean: 111.12200927734375 	 kl mean: 8.196907997131348 	 loss mean: 119.31892395019531
nll mean: 110.86534881591797 	 kl mean: 8.196907997131348 	 loss mean: 119.062255859375
nll mean: 110.77885437011719 	 kl mean: 8.196907997131348 	 loss mean: 118.97576904296875
nll mean: 111.00802612304688 	 kl mean: 8.196907997131348 	 loss mean: 119.20492553710938



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.94it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.20it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.00it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.91123962402344 	 kl mean: 8.196907997131348 	 loss mean: 119.10813903808594
nll mean: 110.76701354980469 	 kl mean: 8.196907997131348 	 loss mean: 118.96392059326172
nll mean: 110.53801727294922 	 kl mean: 8.196907997131348 	 loss mean: 118.73492431640625
nll mean: 110.54814147949219 	 kl mean: 8.196907997131348 	 loss mean: 118.74504852294922
nll mean: 111.1124267578125 	 kl mean: 8.196907997131348 	 loss mean: 119.30933380126953



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.72it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A

nll mean: 85.61244201660156 	 kl mean: 8.369827270507812 	 loss mean: 93.98226165771484
nll mean: 86.34038543701172 	 kl mean: 8.369827270507812 	 loss mean: 94.710205078125
nll mean: 85.90811157226562 	 kl mean: 8.369827270507812 	 loss mean: 94.27793884277344
nll mean: 86.31980895996094 	 kl mean: 8.369827270507812 	 loss mean: 94.68963623046875
nll mean: 86.82305908203125 	 kl mean: 8.369827270507812 	 loss mean: 95.19288635253906
nll mean: 86.4614486694336 	 kl mean: 8.369827270507812 	 loss mean: 94.83128356933594
nll mean: 85.48399353027344 	 kl mean: 8.369827270507812 	 loss mean: 93.85382080078125



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.64it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.55it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 85.46953582763672 	 kl mean: 8.369827270507812 	 loss mean: 93.83935546875
nll mean: 86.06120300292969 	 kl mean: 8.369827270507812 	 loss mean: 94.4310302734375
nll mean: 86.79721069335938 	 kl mean: 8.369827270507812 	 loss mean: 95.16703796386719
Approximate NLL:
tensor(121.1578, device='cuda:0')
Approximate KL:
tensor(8.2359, device='cuda:0')
Testing took 0:00:25.392685


In [16]:
# Show the per-model approximate NLLs collected in `fb_nlls` (one tensor per
# saved model). A bare last expression is the notebook idiom for displaying a
# value and matches how the other cells echo their results; the rendered text
# is the same as print() because a list's str() and repr() are identical.
fb_nlls

[tensor(121.0295, device='cuda:0'), tensor(120.7947, device='cuda:0'), tensor(120.9791, device='cuda:0'), tensor(121.1578, device='cuda:0')]


# MDR

In [17]:
# Collect the saved checkpoint path of every run for the 'mdr10' experiment,
# then echo the list so the selected files are visible in the notebook.
saved_model_files = get_model_filenames(experiment_name='mdr10')
saved_model_files

['results_final/results0/mdr10/models/sentence_vae_MDR_10.0_3500.pt',
 'results_final/results1/mdr10/models/sentence_vae_MDR_10.0_3500.pt',
 'results_final/results2/mdr10/models/sentence_vae_MDR_10.0_3500.pt',
 'results_final/results3/mdr10/models/sentence_vae_MDR_10.0_3500.pt']

In [18]:
# Run the approximate NLL / KL estimation on each MDR checkpoint currently held
# in `saved_model_files`; both returned lists have one entry per checkpoint.
mdr_nlls, mdr_kls = get_approx_nlls(saved_model_files=saved_model_files)

  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.62it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].62it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].62it/s][A

nll mean: 108.19682312011719 	 kl mean: 10.452482223510742 	 loss mean: 118.64930725097656
nll mean: 108.15377807617188 	 kl mean: 10.452482223510742 	 loss mean: 118.60625457763672
nll mean: 108.36959075927734 	 kl mean: 10.452482223510742 	 loss mean: 118.82207489013672
nll mean: 108.12532806396484 	 kl mean: 10.452482223510742 	 loss mean: 118.57780456542969
nll mean: 107.88681030273438 	 kl mean: 10.452482223510742 	 loss mean: 118.33929443359375



                                              
  0%|          | 0/38 [00:00<?, ?it/s].62it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.29it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].29it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].29it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].29it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.03it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.81it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.36609649658203 	 kl mean: 10.452482223510742 	 loss mean: 118.8185806274414
nll mean: 107.93036651611328 	 kl mean: 10.452482223510742 	 loss mean: 118.38285827636719
nll mean: 108.16333770751953 	 kl mean: 10.452482223510742 	 loss mean: 118.61582946777344
nll mean: 107.99119567871094 	 kl mean: 10.452482223510742 	 loss mean: 118.44367980957031
nll mean: 107.82710266113281 	 kl mean: 10.452482223510742 	 loss mean: 118.27958679199219


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 14.36it/s][A

nll mean: 125.21853637695312 	 kl mean: 10.13413143157959 	 loss mean: 135.3526611328125
nll mean: 125.54822540283203 	 kl mean: 10.13413143157959 	 loss mean: 135.68235778808594
nll mean: 125.06880187988281 	 kl mean: 10.13413143157959 	 loss mean: 135.20291137695312


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 14.36it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 40%|████      | 4/10 [00:00<00:00, 14.20it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.19it/s][A

nll mean: 125.16719055175781 	 kl mean: 10.13413143157959 	 loss mean: 135.3013153076172
nll mean: 125.37632751464844 	 kl mean: 10.13413143157959 	 loss mean: 135.51046752929688
nll mean: 125.75092315673828 	 kl mean: 10.13413143157959 	 loss mean: 135.8850555419922


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.19it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.08it/s][A

nll mean: 125.28334045410156 	 kl mean: 10.13413143157959 	 loss mean: 135.41748046875
nll mean: 125.42881774902344 	 kl mean: 10.13413143157959 	 loss mean: 135.56295776367188
nll mean: 125.19739532470703 	 kl mean: 10.13413143157959 	 loss mean: 135.33154296875


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.08it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.03it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 25.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A

nll mean: 125.1697998046875 	 kl mean: 10.13413143157959 	 loss mean: 135.30393981933594
nll mean: 98.01310729980469 	 kl mean: 9.430135726928711 	 loss mean: 107.44324493408203
nll mean: 98.12969207763672 	 kl mean: 9.430135726928711 	 loss mean: 107.55982971191406
nll mean: 98.22184753417969 	 kl mean: 9.430135726928711 	 loss mean: 107.65198516845703
nll mean: 98.04600524902344 	 kl mean: 9.430135726928711 	 loss mean: 107.47615051269531



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.96it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.80it/s][A

nll mean: 98.05474853515625 	 kl mean: 9.430135726928711 	 loss mean: 107.48489379882812
nll mean: 98.07473754882812 	 kl mean: 9.430135726928711 	 loss mean: 107.50486755371094
nll mean: 97.74529266357422 	 kl mean: 9.430135726928711 	 loss mean: 107.17543029785156
nll mean: 98.2998046875 	 kl mean: 9.430135726928711 	 loss mean: 107.72993469238281
nll mean: 97.98301696777344 	 kl mean: 9.430135726928711 	 loss mean: 107.41314697265625



                                              
100%|██████████| 10/10 [00:00<00:00, 24.69it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.75it/s][A

nll mean: 98.20999145507812 	 kl mean: 9.430135726928711 	 loss mean: 107.64012145996094
nll mean: 137.75311279296875 	 kl mean: 10.020685195922852 	 loss mean: 147.7738037109375
nll mean: 137.92376708984375 	 kl mean: 10.020685195922852 	 loss mean: 147.9444580078125



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.81it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A

nll mean: 138.12890625 	 kl mean: 10.020685195922852 	 loss mean: 148.14959716796875
nll mean: 137.90658569335938 	 kl mean: 10.020685195922852 	 loss mean: 147.92727661132812
nll mean: 137.63357543945312 	 kl mean: 10.020685195922852 	 loss mean: 147.6542510986328



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.83it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.84it/s][A

nll mean: 138.3811798095703 	 kl mean: 10.020685195922852 	 loss mean: 148.40185546875
nll mean: 137.02511596679688 	 kl mean: 10.020685195922852 	 loss mean: 147.04580688476562
nll mean: 137.7676544189453 	 kl mean: 10.020685195922852 	 loss mean: 147.78834533691406



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.83it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]

nll mean: 138.10968017578125 	 kl mean: 10.020685195922852 	 loss mean: 148.13037109375
nll mean: 137.92852783203125 	 kl mean: 10.020685195922852 	 loss mean: 147.94921875
nll mean: 122.16737365722656 	 kl mean: 9.447097778320312 	 loss mean: 131.61447143554688



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.04it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.94it/s][A

nll mean: 122.41455078125 	 kl mean: 9.447097778320312 	 loss mean: 131.8616485595703
nll mean: 122.40802001953125 	 kl mean: 9.447097778320312 	 loss mean: 131.8551025390625
nll mean: 122.72557830810547 	 kl mean: 9.447097778320312 	 loss mean: 132.1726837158203



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.94it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A

nll mean: 122.31828308105469 	 kl mean: 9.447097778320312 	 loss mean: 131.765380859375
nll mean: 122.58068084716797 	 kl mean: 9.447097778320312 	 loss mean: 132.02777099609375
nll mean: 122.7999267578125 	 kl mean: 9.447097778320312 	 loss mean: 132.2470245361328



                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.99it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.98it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 122.77609252929688 	 kl mean: 9.447097778320312 	 loss mean: 132.22317504882812
nll mean: 122.54804992675781 	 kl mean: 9.447097778320312 	 loss mean: 131.99514770507812
nll mean: 122.5537109375 	 kl mean: 9.447097778320312 	 loss mean: 132.0008087158203



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.53it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 121.76243591308594 	 kl mean: 9.413286209106445 	 loss mean: 131.17572021484375
nll mean: 122.3392333984375 	 kl mean: 9.413286209106445 	 loss mean: 131.7525177001953
nll mean: 122.3698959350586 	 kl mean: 9.413286209106445 	 loss mean: 131.78317260742188



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.40it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.21it/s][A

nll mean: 121.50656127929688 	 kl mean: 9.413286209106445 	 loss mean: 130.91986083984375
nll mean: 122.07917785644531 	 kl mean: 9.413286209106445 	 loss mean: 131.49246215820312
nll mean: 122.07177734375 	 kl mean: 9.413286209106445 	 loss mean: 131.48504638671875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.22it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 121.65574645996094 	 kl mean: 9.413286209106445 	 loss mean: 131.06903076171875
nll mean: 121.77169036865234 	 kl mean: 9.413286209106445 	 loss mean: 131.18496704101562
nll mean: 122.02293395996094 	 kl mean: 9.413286209106445 	 loss mean: 131.43621826171875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.15it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.54it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 121.91781616210938 	 kl mean: 9.413286209106445 	 loss mean: 131.33111572265625
nll mean: 132.42645263671875 	 kl mean: 9.404303550720215 	 loss mean: 141.83074951171875
nll mean: 132.5816192626953 	 kl mean: 9.404303550720215 	 loss mean: 141.98593139648438
nll mean: 132.16738891601562 	 kl mean: 9.404303550720215 	 loss mean: 141.57168579101562
nll mean: 132.5492706298828 	 kl mean: 9.404303550720215 	 loss mean: 141.95355224609375



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.30it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.07it/s][A

nll mean: 132.02151489257812 	 kl mean: 9.404303550720215 	 loss mean: 141.42581176757812
nll mean: 132.77508544921875 	 kl mean: 9.404303550720215 	 loss mean: 142.17938232421875
nll mean: 132.61529541015625 	 kl mean: 9.404303550720215 	 loss mean: 142.01959228515625
nll mean: 132.47329711914062 	 kl mean: 9.404303550720215 	 loss mean: 141.87759399414062
nll mean: 132.5237274169922 	 kl mean: 9.404303550720215 	 loss mean: 141.92803955078125



                                              
100%|██████████| 10/10 [00:00<00:00, 24.87it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.59it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A

nll mean: 132.5174102783203 	 kl mean: 9.404303550720215 	 loss mean: 141.92172241210938
nll mean: 104.56591796875 	 kl mean: 9.469480514526367 	 loss mean: 114.03539276123047
nll mean: 104.46375274658203 	 kl mean: 9.469480514526367 	 loss mean: 113.93323516845703
nll mean: 104.56465911865234 	 kl mean: 9.469480514526367 	 loss mean: 114.03413391113281
nll mean: 104.36221313476562 	 kl mean: 9.469480514526367 	 loss mean: 113.8316879272461



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.60it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.61it/s][A

nll mean: 104.16090393066406 	 kl mean: 9.469480514526367 	 loss mean: 113.63038635253906
nll mean: 104.56173706054688 	 kl mean: 9.469480514526367 	 loss mean: 114.03121948242188
nll mean: 104.2738265991211 	 kl mean: 9.469480514526367 	 loss mean: 113.74330139160156
nll mean: 104.2199478149414 	 kl mean: 9.469480514526367 	 loss mean: 113.6894302368164
nll mean: 104.09166717529297 	 kl mean: 9.469480514526367 	 loss mean: 113.56114959716797



                                              
100%|██████████| 10/10 [00:00<00:00, 24.60it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.55it/s][A

nll mean: 104.5696029663086 	 kl mean: 9.469480514526367 	 loss mean: 114.0390853881836
nll mean: 130.30514526367188 	 kl mean: 10.190142631530762 	 loss mean: 140.49530029296875
nll mean: 129.8035125732422 	 kl mean: 10.190142631530762 	 loss mean: 139.99365234375


                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.55it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
                                              

nll mean: 129.84619140625 	 kl mean: 10.190142631530762 	 loss mean: 140.03634643554688
nll mean: 129.6634521484375 	 kl mean: 10.190142631530762 	 loss mean: 139.85357666015625
nll mean: 130.01055908203125 	 kl mean: 10.190142631530762 	 loss mean: 140.20071411132812


 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.90it/s][A
                                              [A

nll mean: 129.62078857421875 	 kl mean: 10.190142631530762 	 loss mean: 139.81092834472656
nll mean: 130.2579803466797 	 kl mean: 10.190142631530762 	 loss mean: 140.4481201171875
nll mean: 129.81491088867188 	 kl mean: 10.190142631530762 	 loss mean: 140.0050506591797



 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 15.03it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s]


nll mean: 129.58180236816406 	 kl mean: 10.190142631530762 	 loss mean: 139.77194213867188
nll mean: 129.82455444335938 	 kl mean: 10.190142631530762 	 loss mean: 140.01467895507812
nll mean: 128.85986328125 	 kl mean: 9.887764930725098 	 loss mean: 138.74761962890625
nll mean: 128.3947296142578 	 kl mean: 9.887764930725098 	 loss mean: 138.28250122070312


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s]
 30%|███       | 3/10 [00:00<00:00, 22.04it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.72it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A

nll mean: 129.20071411132812 	 kl mean: 9.887764930725098 	 loss mean: 139.08848571777344
nll mean: 129.38577270507812 	 kl mean: 9.887764930725098 	 loss mean: 139.2735595703125
nll mean: 128.85092163085938 	 kl mean: 9.887764930725098 	 loss mean: 138.73867797851562
nll mean: 129.42221069335938 	 kl mean: 9.887764930725098 	 loss mean: 139.3099822998047
nll mean: 128.78250122070312 	 kl mean: 9.887764930725098 	 loss mean: 138.67025756835938



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.75it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.48it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.36it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.9536590576172 	 kl mean: 9.887764930725098 	 loss mean: 138.8414306640625
nll mean: 129.0346221923828 	 kl mean: 9.887764930725098 	 loss mean: 138.92239379882812
nll mean: 129.26605224609375 	 kl mean: 9.887764930725098 	 loss mean: 139.15380859375
nll mean: 116.44232940673828 	 kl mean: 10.088533401489258 	 loss mean: 126.5308609008789
nll mean: 116.98440551757812 	 kl mean: 10.088533401489258 	 loss mean: 127.07293701171875


                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:05<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
 30%|███       | 3/10 [00:00<00:00, 24.77it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.71it/s][A

nll mean: 116.62828826904297 	 kl mean: 10.088533401489258 	 loss mean: 126.7168197631836
nll mean: 116.54360961914062 	 kl mean: 10.088533401489258 	 loss mean: 126.63214874267578
nll mean: 116.23208618164062 	 kl mean: 10.088533401489258 	 loss mean: 126.32061767578125
nll mean: 116.2840347290039 	 kl mean: 10.088533401489258 	 loss mean: 126.37256622314453
nll mean: 116.24638366699219 	 kl mean: 10.088533401489258 	 loss mean: 126.33492279052734


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.71it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.85it/s]
100%|██████████| 10/10 [00:00<00:00, 24.74it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]

nll mean: 116.63066101074219 	 kl mean: 10.088533401489258 	 loss mean: 126.71919250488281
nll mean: 116.08271026611328 	 kl mean: 10.088533401489258 	 loss mean: 126.1712417602539
nll mean: 117.03131866455078 	 kl mean: 10.088533401489258 	 loss mean: 127.11985778808594
nll mean: 139.37388610839844 	 kl mean: 9.788990020751953 	 loss mean: 149.16287231445312
nll mean: 139.48263549804688 	 kl mean: 9.788990020751953 	 loss mean: 149.2716064453125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 21.08it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A

nll mean: 139.46560668945312 	 kl mean: 9.788990020751953 	 loss mean: 149.25457763671875
nll mean: 139.47015380859375 	 kl mean: 9.788990020751953 	 loss mean: 149.25914001464844
nll mean: 139.53176879882812 	 kl mean: 9.788990020751953 	 loss mean: 149.32073974609375
nll mean: 139.17315673828125 	 kl mean: 9.788990020751953 	 loss mean: 148.962158203125
nll mean: 139.8402099609375 	 kl mean: 9.788990020751953 	 loss mean: 149.62921142578125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  2.00it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.07it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.13it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]

nll mean: 139.40602111816406 	 kl mean: 9.788990020751953 	 loss mean: 149.19500732421875
nll mean: 139.66905212402344 	 kl mean: 9.788990020751953 	 loss mean: 149.45803833007812
nll mean: 139.41387939453125 	 kl mean: 9.788990020751953 	 loss mean: 149.20286560058594
nll mean: 117.91265869140625 	 kl mean: 10.054593086242676 	 loss mean: 127.9672622680664



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.03it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.63it/s][A

nll mean: 118.40821075439453 	 kl mean: 10.054593086242676 	 loss mean: 128.46279907226562
nll mean: 118.62303161621094 	 kl mean: 10.054593086242676 	 loss mean: 128.67762756347656
nll mean: 118.55799865722656 	 kl mean: 10.054593086242676 	 loss mean: 128.6125946044922



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A

nll mean: 118.48039245605469 	 kl mean: 10.054593086242676 	 loss mean: 128.5349884033203
nll mean: 118.00888061523438 	 kl mean: 10.054593086242676 	 loss mean: 128.0634765625
nll mean: 117.80635070800781 	 kl mean: 10.054593086242676 	 loss mean: 127.86094665527344



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.03it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.55it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.31461334228516 	 kl mean: 10.054593086242676 	 loss mean: 128.36920166015625
nll mean: 117.71556091308594 	 kl mean: 10.054593086242676 	 loss mean: 127.77015686035156
nll mean: 118.12704467773438 	 kl mean: 10.054593086242676 	 loss mean: 128.181640625



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 10%|█         | 1/10 [00:00<00:00,  9.95it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.91it/s][A
                                              

nll mean: 159.811279296875 	 kl mean: 10.681200981140137 	 loss mean: 170.49249267578125
nll mean: 159.2489013671875 	 kl mean: 10.681200981140137 	 loss mean: 169.93011474609375


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.92it/s][A
                                               


nll mean: 159.30992126464844 	 kl mean: 10.681200981140137 	 loss mean: 169.99111938476562
nll mean: 159.42279052734375 	 kl mean: 10.681200981140137 	 loss mean: 170.10398864746094
nll mean: 159.1752471923828 	 kl mean: 10.681200981140137 	 loss mean: 169.8564453125


 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.95it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.90it/s][A


nll mean: 159.6563720703125 	 kl mean: 10.681200981140137 	 loss mean: 170.33758544921875
nll mean: 159.53501892089844 	 kl mean: 10.681200981140137 	 loss mean: 170.21621704101562


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.93it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.88it/s][A

nll mean: 159.8271026611328 	 kl mean: 10.681200981140137 	 loss mean: 170.50830078125
nll mean: 159.26150512695312 	 kl mean: 10.681200981140137 	 loss mean: 169.94271850585938



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.92it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.42it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 159.3924560546875 	 kl mean: 10.681200981140137 	 loss mean: 170.0736541748047
nll mean: 132.8720703125 	 kl mean: 9.206886291503906 	 loss mean: 142.07894897460938
nll mean: 133.48391723632812 	 kl mean: 9.206886291503906 	 loss mean: 142.6907958984375
nll mean: 133.35101318359375 	 kl mean: 9.206886291503906 	 loss mean: 142.55789184570312



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.13it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.11it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 133.59890747070312 	 kl mean: 9.206886291503906 	 loss mean: 142.80580139160156
nll mean: 133.25164794921875 	 kl mean: 9.206886291503906 	 loss mean: 142.45852661132812
nll mean: 134.0250701904297 	 kl mean: 9.206886291503906 	 loss mean: 143.23196411132812
nll mean: 133.44361877441406 	 kl mean: 9.206886291503906 	 loss mean: 142.6505126953125



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.01it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.95it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.32281494140625 	 kl mean: 9.206886291503906 	 loss mean: 142.52969360351562
nll mean: 133.22674560546875 	 kl mean: 9.206886291503906 	 loss mean: 142.4336395263672
nll mean: 133.413818359375 	 kl mean: 9.206886291503906 	 loss mean: 142.62069702148438


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A

nll mean: 141.9861602783203 	 kl mean: 9.931474685668945 	 loss mean: 151.91763305664062
nll mean: 142.20660400390625 	 kl mean: 9.931474685668945 	 loss mean: 152.13807678222656
nll mean: 142.2542724609375 	 kl mean: 9.931474685668945 	 loss mean: 152.18576049804688


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.82it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.81it/s][A

nll mean: 142.24234008789062 	 kl mean: 9.931474685668945 	 loss mean: 152.173828125
nll mean: 141.906494140625 	 kl mean: 9.931474685668945 	 loss mean: 151.83798217773438
nll mean: 141.96763610839844 	 kl mean: 9.931474685668945 	 loss mean: 151.89910888671875


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.81it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A

nll mean: 141.633056640625 	 kl mean: 9.931474685668945 	 loss mean: 151.5645294189453
nll mean: 142.2028350830078 	 kl mean: 9.931474685668945 	 loss mean: 152.13430786132812
nll mean: 142.18197631835938 	 kl mean: 9.931474685668945 	 loss mean: 152.11343383789062


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.73it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.62it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A

nll mean: 142.11883544921875 	 kl mean: 9.931474685668945 	 loss mean: 152.05032348632812
nll mean: 143.69100952148438 	 kl mean: 9.441064834594727 	 loss mean: 153.13206481933594
nll mean: 144.36087036132812 	 kl mean: 9.441064834594727 	 loss mean: 153.80194091796875
nll mean: 143.43096923828125 	 kl mean: 9.441064834594727 	 loss mean: 152.87203979492188
nll mean: 143.60708618164062 	 kl mean: 9.441064834594727 	 loss mean: 153.0481414794922



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.48it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.50it/s][A

nll mean: 144.1976318359375 	 kl mean: 9.441064834594727 	 loss mean: 153.63868713378906
nll mean: 144.0448760986328 	 kl mean: 9.441064834594727 	 loss mean: 153.48594665527344
nll mean: 144.49478149414062 	 kl mean: 9.441064834594727 	 loss mean: 153.93585205078125
nll mean: 143.99105834960938 	 kl mean: 9.441064834594727 	 loss mean: 153.43212890625
nll mean: 144.42555236816406 	 kl mean: 9.441064834594727 	 loss mean: 153.8666229248047



                                               
100%|██████████| 10/10 [00:00<00:00, 24.41it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A

nll mean: 144.374755859375 	 kl mean: 9.441064834594727 	 loss mean: 153.8157958984375
nll mean: 132.9092254638672 	 kl mean: 9.616434097290039 	 loss mean: 142.52566528320312
nll mean: 133.41549682617188 	 kl mean: 9.616434097290039 	 loss mean: 143.0319366455078
nll mean: 132.55111694335938 	 kl mean: 9.616434097290039 	 loss mean: 142.1675567626953
nll mean: 133.39022827148438 	 kl mean: 9.616434097290039 	 loss mean: 143.00668334960938


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.88it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.83it/s][A

nll mean: 132.43673706054688 	 kl mean: 9.616434097290039 	 loss mean: 142.05316162109375
nll mean: 133.14089965820312 	 kl mean: 9.616434097290039 	 loss mean: 142.75732421875
nll mean: 133.24966430664062 	 kl mean: 9.616434097290039 	 loss mean: 142.8660888671875
nll mean: 132.76809692382812 	 kl mean: 9.616434097290039 	 loss mean: 142.384521484375
nll mean: 132.71751403808594 	 kl mean: 9.616434097290039 	 loss mean: 142.33395385742188


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
100%|██████████| 10/10 [00:00<00:00, 24.76it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
 20%|██        | 2/10 [00:00<00:00, 12.51it/s][A

nll mean: 132.92922973632812 	 kl mean: 9.616434097290039 	 loss mean: 142.54566955566406
nll mean: 127.18788146972656 	 kl mean: 10.630464553833008 	 loss mean: 137.81834411621094
nll mean: 127.59784698486328 	 kl mean: 10.630464553833008 	 loss mean: 138.22830200195312



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.64it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A

nll mean: 127.78355407714844 	 kl mean: 10.630464553833008 	 loss mean: 138.4140167236328
nll mean: 127.3238754272461 	 kl mean: 10.630464553833008 	 loss mean: 137.954345703125
nll mean: 128.23406982421875 	 kl mean: 10.630464553833008 	 loss mean: 138.86453247070312



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.64it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A

nll mean: 127.41402435302734 	 kl mean: 10.630464553833008 	 loss mean: 138.0444793701172
nll mean: 127.57667541503906 	 kl mean: 10.630464553833008 	 loss mean: 138.20713806152344
nll mean: 127.45122528076172 	 kl mean: 10.630464553833008 	 loss mean: 138.08169555664062



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.74it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]

nll mean: 127.3104248046875 	 kl mean: 10.630464553833008 	 loss mean: 137.94088745117188
nll mean: 127.55796813964844 	 kl mean: 10.630464553833008 	 loss mean: 138.1884307861328
nll mean: 145.3743896484375 	 kl mean: 9.864140510559082 	 loss mean: 155.238525390625



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 12.73it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.61it/s][A

nll mean: 145.09515380859375 	 kl mean: 9.864140510559082 	 loss mean: 154.95928955078125
nll mean: 145.37039184570312 	 kl mean: 9.864140510559082 	 loss mean: 155.23452758789062
nll mean: 145.1400604248047 	 kl mean: 9.864140510559082 	 loss mean: 155.00421142578125



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.58it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A

nll mean: 145.58697509765625 	 kl mean: 9.864140510559082 	 loss mean: 155.45111083984375
nll mean: 145.60670471191406 	 kl mean: 9.864140510559082 	 loss mean: 155.47085571289062
nll mean: 145.29818725585938 	 kl mean: 9.864140510559082 	 loss mean: 155.16232299804688



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.51it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.44it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.92794799804688 	 kl mean: 9.864140510559082 	 loss mean: 154.79209899902344
nll mean: 145.26022338867188 	 kl mean: 9.864140510559082 	 loss mean: 155.12435913085938
nll mean: 145.56753540039062 	 kl mean: 9.864140510559082 	 loss mean: 155.43167114257812


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.62it/s][A

nll mean: 154.62490844726562 	 kl mean: 10.015377044677734 	 loss mean: 164.64028930664062
nll mean: 153.993408203125 	 kl mean: 10.015377044677734 	 loss mean: 164.0087890625
nll mean: 154.27023315429688 	 kl mean: 10.015377044677734 	 loss mean: 164.28561401367188


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.62it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A

nll mean: 153.76541137695312 	 kl mean: 10.015377044677734 	 loss mean: 163.78079223632812
nll mean: 154.2169189453125 	 kl mean: 10.015377044677734 	 loss mean: 164.2322998046875
nll mean: 154.681884765625 	 kl mean: 10.015377044677734 	 loss mean: 164.69725036621094


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A

nll mean: 154.20309448242188 	 kl mean: 10.015377044677734 	 loss mean: 164.21849060058594
nll mean: 154.6536407470703 	 kl mean: 10.015377044677734 	 loss mean: 164.66900634765625
nll mean: 154.299560546875 	 kl mean: 10.015377044677734 	 loss mean: 164.31494140625


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.39it/s][A

nll mean: 153.72665405273438 	 kl mean: 10.015377044677734 	 loss mean: 163.74203491210938
nll mean: 116.64727783203125 	 kl mean: 9.965492248535156 	 loss mean: 126.61276245117188
nll mean: 116.0032958984375 	 kl mean: 9.965492248535156 	 loss mean: 125.96880340576172



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.40it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.27it/s][A

nll mean: 116.74136352539062 	 kl mean: 9.965492248535156 	 loss mean: 126.70684814453125
nll mean: 116.78636169433594 	 kl mean: 9.965492248535156 	 loss mean: 126.75184631347656
nll mean: 117.01239013671875 	 kl mean: 9.965492248535156 	 loss mean: 126.97787475585938



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.23it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A

nll mean: 116.33391571044922 	 kl mean: 9.965492248535156 	 loss mean: 126.29940795898438
nll mean: 116.65869140625 	 kl mean: 9.965492248535156 	 loss mean: 126.62419128417969
nll mean: 117.15507507324219 	 kl mean: 9.965492248535156 	 loss mean: 127.12057495117188



 80%|████████  | 8/10 [00:00<00:00, 10.16it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.22it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]

nll mean: 116.5490951538086 	 kl mean: 9.965492248535156 	 loss mean: 126.51458740234375
nll mean: 116.63672637939453 	 kl mean: 9.965492248535156 	 loss mean: 126.60221862792969
nll mean: 105.73393249511719 	 kl mean: 8.780094146728516 	 loss mean: 114.51403045654297
nll mean: 105.17265319824219 	 kl mean: 8.780094146728516 	 loss mean: 113.95275115966797
nll mean: 105.02757263183594 	 kl mean: 8.780094146728516 	 loss mean: 113.80767059326172



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.48it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
 80%|████████  | 8/10 [00:00<00:00, 33.27it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.97it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.20409393310547 	 kl mean: 8.780094146728516 	 loss mean: 113.98419189453125
nll mean: 104.64802551269531 	 kl mean: 8.780094146728516 	 loss mean: 113.4281234741211
nll mean: 104.95665740966797 	 kl mean: 8.780094146728516 	 loss mean: 113.73675537109375
nll mean: 104.97932434082031 	 kl mean: 8.780094146728516 	 loss mean: 113.75941467285156
nll mean: 105.59046936035156 	 kl mean: 8.780094146728516 	 loss mean: 114.37055969238281
nll mean: 104.84878540039062 	 kl mean: 8.780094146728516 	 loss mean: 113.6288833618164
nll mean: 105.06288146972656 	 kl mean: 8.780094146728516 	 loss mean: 113.84297180175781



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.72it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A

nll mean: 155.50909423828125 	 kl mean: 9.866863250732422 	 loss mean: 165.37594604492188
nll mean: 155.70767211914062 	 kl mean: 9.866863250732422 	 loss mean: 165.57452392578125
nll mean: 155.91616821289062 	 kl mean: 9.866863250732422 	 loss mean: 165.78302001953125



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.63it/s][A

nll mean: 155.42282104492188 	 kl mean: 9.866863250732422 	 loss mean: 165.2896728515625
nll mean: 155.2680206298828 	 kl mean: 9.866863250732422 	 loss mean: 165.1348876953125
nll mean: 156.12728881835938 	 kl mean: 9.866863250732422 	 loss mean: 165.99415588378906



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.64it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A

nll mean: 155.26852416992188 	 kl mean: 9.866863250732422 	 loss mean: 165.13539123535156
nll mean: 156.0679931640625 	 kl mean: 9.866863250732422 	 loss mean: 165.9348602294922
nll mean: 155.34274291992188 	 kl mean: 9.866863250732422 	 loss mean: 165.2095947265625



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.61it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.59it/s][A

nll mean: 155.70806884765625 	 kl mean: 9.866863250732422 	 loss mean: 165.57493591308594
nll mean: 118.92386627197266 	 kl mean: 10.509109497070312 	 loss mean: 129.4329833984375
nll mean: 118.95361328125 	 kl mean: 10.509109497070312 	 loss mean: 129.46273803710938
nll mean: 118.09425354003906 	 kl mean: 10.509109497070312 	 loss mean: 128.6033477783203
nll mean: 118.857666015625 	 kl mean: 10.509109497070312 	 loss mean: 129.3667755126953


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.59it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.20it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.95it/s][A

nll mean: 118.94911193847656 	 kl mean: 10.509109497070312 	 loss mean: 129.45822143554688
nll mean: 118.51702117919922 	 kl mean: 10.509109497070312 	 loss mean: 129.02613830566406
nll mean: 118.34814453125 	 kl mean: 10.509109497070312 	 loss mean: 128.8572540283203
nll mean: 118.3260498046875 	 kl mean: 10.509109497070312 	 loss mean: 128.83514404296875
nll mean: 118.25611877441406 	 kl mean: 10.509109497070312 	 loss mean: 128.76522827148438


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.68it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.67it/s][A

nll mean: 118.9329605102539 	 kl mean: 10.509109497070312 	 loss mean: 129.44207763671875
nll mean: 112.61382293701172 	 kl mean: 9.177637100219727 	 loss mean: 121.79145812988281
nll mean: 112.56793212890625 	 kl mean: 9.177637100219727 	 loss mean: 121.74557495117188



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.76it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A

nll mean: 112.91910552978516 	 kl mean: 9.177637100219727 	 loss mean: 122.09674072265625
nll mean: 112.622314453125 	 kl mean: 9.177637100219727 	 loss mean: 121.79995727539062
nll mean: 112.34382629394531 	 kl mean: 9.177637100219727 	 loss mean: 121.52145385742188



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.68it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.74it/s][A

nll mean: 112.65397644042969 	 kl mean: 9.177637100219727 	 loss mean: 121.83161926269531
nll mean: 112.63177490234375 	 kl mean: 9.177637100219727 	 loss mean: 121.80941009521484
nll mean: 112.70852661132812 	 kl mean: 9.177637100219727 	 loss mean: 121.88615417480469



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.73it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               

nll mean: 113.20838928222656 	 kl mean: 9.177637100219727 	 loss mean: 122.38602447509766
nll mean: 112.3927001953125 	 kl mean: 9.177637100219727 	 loss mean: 121.57032775878906
nll mean: 80.55671691894531 	 kl mean: 9.03547477722168 	 loss mean: 89.5921859741211
nll mean: 80.46365356445312 	 kl mean: 9.03547477722168 	 loss mean: 89.49913024902344



 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 23.09it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.63it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A

nll mean: 80.416259765625 	 kl mean: 9.03547477722168 	 loss mean: 89.45173645019531
nll mean: 80.64222717285156 	 kl mean: 9.03547477722168 	 loss mean: 89.67769622802734
nll mean: 79.87760162353516 	 kl mean: 9.03547477722168 	 loss mean: 88.91307067871094
nll mean: 80.25099182128906 	 kl mean: 9.03547477722168 	 loss mean: 89.28646850585938
nll mean: 80.15984344482422 	 kl mean: 9.03547477722168 	 loss mean: 89.1953125
nll mean: 80.64630126953125 	 kl mean: 9.03547477722168 	 loss mean: 89.68177795410156



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.47it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.20it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A

nll mean: 80.54927062988281 	 kl mean: 9.03547477722168 	 loss mean: 89.5847396850586
nll mean: 80.63634490966797 	 kl mean: 9.03547477722168 	 loss mean: 89.67182922363281
nll mean: 106.73905944824219 	 kl mean: 9.19906997680664 	 loss mean: 115.93812561035156
nll mean: 106.42881774902344 	 kl mean: 9.19906997680664 	 loss mean: 115.62788391113281
nll mean: 106.77549743652344 	 kl mean: 9.19906997680664 	 loss mean: 115.97456359863281



                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.59it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s][A

nll mean: 106.24520874023438 	 kl mean: 9.19906997680664 	 loss mean: 115.44429016113281
nll mean: 106.47136688232422 	 kl mean: 9.19906997680664 	 loss mean: 115.6704330444336
nll mean: 106.98373413085938 	 kl mean: 9.19906997680664 	 loss mean: 116.18279266357422
nll mean: 106.30335998535156 	 kl mean: 9.19906997680664 	 loss mean: 115.50242614746094
nll mean: 106.34500885009766 	 kl mean: 9.19906997680664 	 loss mean: 115.54408264160156



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.72it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.70it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]

nll mean: 106.40486907958984 	 kl mean: 9.19906997680664 	 loss mean: 115.60394287109375
nll mean: 106.05169677734375 	 kl mean: 9.19906997680664 	 loss mean: 115.25076293945312
nll mean: 118.9752426147461 	 kl mean: 9.65126895904541 	 loss mean: 128.6265106201172



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s]
 20%|██        | 2/10 [00:00<00:00, 12.34it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A

nll mean: 118.0802001953125 	 kl mean: 9.65126895904541 	 loss mean: 127.73145294189453
nll mean: 118.09278869628906 	 kl mean: 9.65126895904541 	 loss mean: 127.74405670166016
nll mean: 118.17530822753906 	 kl mean: 9.65126895904541 	 loss mean: 127.82658386230469



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.48it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A

nll mean: 118.73062133789062 	 kl mean: 9.65126895904541 	 loss mean: 128.38189697265625
nll mean: 118.41551208496094 	 kl mean: 9.65126895904541 	 loss mean: 128.0667724609375
nll mean: 118.65292358398438 	 kl mean: 9.65126895904541 	 loss mean: 128.30419921875



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.85it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.85it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.48it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.58563232421875 	 kl mean: 9.65126895904541 	 loss mean: 128.23690795898438
nll mean: 118.04118347167969 	 kl mean: 9.65126895904541 	 loss mean: 127.69244384765625
nll mean: 119.10147094726562 	 kl mean: 9.65126895904541 	 loss mean: 128.75274658203125



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.00it/s][A
                                               
 20%|██        | 2/10 [00:00<00:00, 10.00it/s]

nll mean: 60.0008659362793 	 kl mean: 9.850790023803711 	 loss mean: 69.85165405273438
nll mean: 59.39756774902344 	 kl mean: 9.850790023803711 	 loss mean: 69.24836730957031
nll mean: 60.268672943115234 	 kl mean: 9.850790023803711 	 loss mean: 70.11946105957031


 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.02it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.99it/s][A

nll mean: 59.382904052734375 	 kl mean: 9.850790023803711 	 loss mean: 69.23369598388672
nll mean: 59.79231262207031 	 kl mean: 9.850790023803711 	 loss mean: 69.64310455322266



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.02it/s][A

nll mean: 59.74745559692383 	 kl mean: 9.850790023803711 	 loss mean: 69.5982437133789
nll mean: 60.33945083618164 	 kl mean: 9.850790023803711 	 loss mean: 70.19024658203125
nll mean: 59.68946075439453 	 kl mean: 9.850790023803711 	 loss mean: 69.54025268554688



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.05it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 59.84995651245117 	 kl mean: 9.850790023803711 	 loss mean: 69.70074462890625
nll mean: 59.71091842651367 	 kl mean: 9.850790023803711 	 loss mean: 69.56170654296875
nll mean: 102.56494140625 	 kl mean: 9.681859016418457 	 loss mean: 112.24681091308594


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 12.98it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.76it/s][A

nll mean: 102.48265838623047 	 kl mean: 9.681859016418457 	 loss mean: 112.16451263427734
nll mean: 103.25381469726562 	 kl mean: 9.681859016418457 	 loss mean: 112.93567657470703
nll mean: 102.6918716430664 	 kl mean: 9.681859016418457 	 loss mean: 112.37372589111328


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 12.76it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.67it/s][A

nll mean: 102.46875 	 kl mean: 9.681859016418457 	 loss mean: 112.1506118774414
nll mean: 102.48231506347656 	 kl mean: 9.681859016418457 	 loss mean: 112.1641845703125
nll mean: 102.77593994140625 	 kl mean: 9.681859016418457 	 loss mean: 112.45779418945312


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.67it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.62it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.58it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 102.28431701660156 	 kl mean: 9.681859016418457 	 loss mean: 111.96617126464844
nll mean: 102.1798095703125 	 kl mean: 9.681859016418457 	 loss mean: 111.8616714477539
nll mean: 102.32342529296875 	 kl mean: 9.681859016418457 	 loss mean: 112.00527954101562


                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00, 10.12it/s][A

nll mean: 134.36875915527344 	 kl mean: 10.653377532958984 	 loss mean: 145.02212524414062
nll mean: 134.89752197265625 	 kl mean: 10.653377532958984 	 loss mean: 145.5509033203125
nll mean: 134.6678466796875 	 kl mean: 10.653377532958984 	 loss mean: 145.32122802734375


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00, 10.12it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 40%|████      | 4/10 [00:00<00:00, 10.13it/s]

nll mean: 134.73379516601562 	 kl mean: 10.653377532958984 	 loss mean: 145.38717651367188
nll mean: 135.15267944335938 	 kl mean: 10.653377532958984 	 loss mean: 145.80606079101562
nll mean: 135.05584716796875 	 kl mean: 10.653377532958984 	 loss mean: 145.709228515625


[A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.11it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.05it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 10.06it/s]

nll mean: 134.5927276611328 	 kl mean: 10.653377532958984 	 loss mean: 145.24612426757812
nll mean: 134.45407104492188 	 kl mean: 10.653377532958984 	 loss mean: 145.10745239257812
nll mean: 134.53958129882812 	 kl mean: 10.653377532958984 	 loss mean: 145.19296264648438


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 90%|█████████ | 9/10 [00:00<00:00, 10.06it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.05it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.11it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A

nll mean: 134.84603881835938 	 kl mean: 10.653377532958984 	 loss mean: 145.49942016601562
nll mean: 63.9539680480957 	 kl mean: 8.47960376739502 	 loss mean: 72.4335708618164
nll mean: 63.59482192993164 	 kl mean: 8.47960376739502 	 loss mean: 72.07442474365234
nll mean: 63.765472412109375 	 kl mean: 8.47960376739502 	 loss mean: 72.24507141113281
nll mean: 63.80860137939453 	 kl mean: 8.47960376739502 	 loss mean: 72.2882080078125
nll mean: 63.93778610229492 	 kl mean: 8.47960376739502 	 loss mean: 72.41738891601562



                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.80it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.67it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.51it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 63.41870880126953 	 kl mean: 8.47960376739502 	 loss mean: 71.89830780029297
nll mean: 63.519954681396484 	 kl mean: 8.47960376739502 	 loss mean: 71.99955749511719
nll mean: 63.75501251220703 	 kl mean: 8.47960376739502 	 loss mean: 72.234619140625
nll mean: 64.14170837402344 	 kl mean: 8.47960376739502 	 loss mean: 72.6213150024414
nll mean: 63.51986312866211 	 kl mean: 8.47960376739502 	 loss mean: 71.99946594238281


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 21.41it/s][A

nll mean: 117.77008819580078 	 kl mean: 9.461044311523438 	 loss mean: 127.23112487792969
nll mean: 117.24913024902344 	 kl mean: 9.461044311523438 	 loss mean: 126.71016693115234
nll mean: 117.33979034423828 	 kl mean: 9.461044311523438 	 loss mean: 126.80083465576172
nll mean: 117.55204010009766 	 kl mean: 9.461044311523438 	 loss mean: 127.0130844116211
nll mean: 117.19113159179688 	 kl mean: 9.461044311523438 	 loss mean: 126.65217590332031


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 21.41it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.40it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
100%|██████████| 10/10 [00:00<00:00, 21.46it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.64646911621094 	 kl mean: 9.461044311523438 	 loss mean: 127.1075210571289
nll mean: 117.14934539794922 	 kl mean: 9.461044311523438 	 loss mean: 126.61039733886719
nll mean: 118.25772094726562 	 kl mean: 9.461044311523438 	 loss mean: 127.71876525878906
nll mean: 117.29379272460938 	 kl mean: 9.461044311523438 	 loss mean: 126.75483703613281
nll mean: 117.54335021972656 	 kl mean: 9.461044311523438 	 loss mean: 127.00439453125



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s][A

nll mean: 117.799560546875 	 kl mean: 9.637514114379883 	 loss mean: 127.43707275390625
nll mean: 118.16287231445312 	 kl mean: 9.637514114379883 	 loss mean: 127.80038452148438
nll mean: 118.0198974609375 	 kl mean: 9.637514114379883 	 loss mean: 127.65740966796875



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.64it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.62it/s][A

nll mean: 118.16490173339844 	 kl mean: 9.637514114379883 	 loss mean: 127.80242156982422
nll mean: 118.3796615600586 	 kl mean: 9.637514114379883 	 loss mean: 128.01718139648438
nll mean: 118.41429901123047 	 kl mean: 9.637514114379883 	 loss mean: 128.05181884765625



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.62it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A

nll mean: 118.21861267089844 	 kl mean: 9.637514114379883 	 loss mean: 127.85613250732422
nll mean: 118.0374755859375 	 kl mean: 9.637514114379883 	 loss mean: 127.67498779296875
nll mean: 118.01365661621094 	 kl mean: 9.637514114379883 	 loss mean: 127.65116882324219



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.53it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 10.32it/s][A

nll mean: 118.67855072021484 	 kl mean: 9.637514114379883 	 loss mean: 128.31607055664062
nll mean: 113.18344116210938 	 kl mean: 9.532913208007812 	 loss mean: 122.71636199951172
nll mean: 113.4168930053711 	 kl mean: 9.532913208007812 	 loss mean: 122.94979858398438



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.34it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A

nll mean: 113.06610870361328 	 kl mean: 9.532913208007812 	 loss mean: 122.59902954101562
nll mean: 113.59521484375 	 kl mean: 9.532913208007812 	 loss mean: 123.12812805175781
nll mean: 112.95100402832031 	 kl mean: 9.532913208007812 	 loss mean: 122.48392486572266



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.43it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.45it/s][A

nll mean: 113.82899475097656 	 kl mean: 9.532913208007812 	 loss mean: 123.36190795898438
nll mean: 113.5384521484375 	 kl mean: 9.532913208007812 	 loss mean: 123.07136535644531
nll mean: 113.20771789550781 	 kl mean: 9.532913208007812 	 loss mean: 122.7406234741211



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.46it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]

nll mean: 113.11712646484375 	 kl mean: 9.532913208007812 	 loss mean: 122.65003967285156
nll mean: 112.84043884277344 	 kl mean: 9.532913208007812 	 loss mean: 122.37335205078125
nll mean: 110.38948059082031 	 kl mean: 9.53270149230957 	 loss mean: 119.92218017578125
nll mean: 110.45652770996094 	 kl mean: 9.53270149230957 	 loss mean: 119.98922729492188



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.71it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.90it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A

nll mean: 110.53358459472656 	 kl mean: 9.53270149230957 	 loss mean: 120.0662841796875
nll mean: 110.6351318359375 	 kl mean: 9.53270149230957 	 loss mean: 120.16783905029297
nll mean: 110.97593688964844 	 kl mean: 9.53270149230957 	 loss mean: 120.50863647460938
nll mean: 111.15638732910156 	 kl mean: 9.53270149230957 	 loss mean: 120.68909454345703
nll mean: 110.38624572753906 	 kl mean: 9.53270149230957 	 loss mean: 119.9189453125



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.89it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.23it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 111.059326171875 	 kl mean: 9.53270149230957 	 loss mean: 120.59202575683594
nll mean: 110.40328979492188 	 kl mean: 9.53270149230957 	 loss mean: 119.93599700927734
nll mean: 110.40007019042969 	 kl mean: 9.53270149230957 	 loss mean: 119.93277740478516
nll mean: 85.19773864746094 	 kl mean: 9.9745512008667 	 loss mean: 95.17229461669922
nll mean: 85.85222625732422 	 kl mean: 9.9745512008667 	 loss mean: 95.82677459716797
nll mean: 85.12705993652344 	 kl mean: 9.9745512008667 	 loss mean: 95.10159301757812


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.91it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 30.63it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]

nll mean: 85.21764373779297 	 kl mean: 9.9745512008667 	 loss mean: 95.19219970703125
nll mean: 85.11031341552734 	 kl mean: 9.9745512008667 	 loss mean: 95.08486938476562
nll mean: 84.96333312988281 	 kl mean: 9.9745512008667 	 loss mean: 94.93788146972656
nll mean: 85.06260681152344 	 kl mean: 9.9745512008667 	 loss mean: 95.03715515136719
nll mean: 85.32870483398438 	 kl mean: 9.9745512008667 	 loss mean: 95.30325317382812
nll mean: 84.83598327636719 	 kl mean: 9.9745512008667 	 loss mean: 94.81053161621094
nll mean: 85.286376953125 	 kl mean: 9.9745512008667 	 loss mean: 95.26092529296875
Approximate NLL:





tensor(119.7677, device='cuda:0')
Approximate KL:
tensor(9.7394, device='cuda:0')
Testing took 0:00:25.265878


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.81it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].81it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].81it/s][A

nll mean: 108.26362609863281 	 kl mean: 10.015586853027344 	 loss mean: 118.27921295166016
nll mean: 108.39762878417969 	 kl mean: 10.015586853027344 	 loss mean: 118.4132080078125
nll mean: 108.74920654296875 	 kl mean: 10.015586853027344 	 loss mean: 118.76478576660156
nll mean: 108.35527801513672 	 kl mean: 10.015586853027344 	 loss mean: 118.37086486816406
nll mean: 109.02265930175781 	 kl mean: 10.015586853027344 	 loss mean: 119.03823852539062



                                              
  0%|          | 0/38 [00:00<?, ?it/s].81it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.45it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].45it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].45it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].45it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.30it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.08it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.73766326904297 	 kl mean: 10.015586853027344 	 loss mean: 118.75325775146484
nll mean: 108.60005187988281 	 kl mean: 10.015586853027344 	 loss mean: 118.61563873291016
nll mean: 108.8737564086914 	 kl mean: 10.015586853027344 	 loss mean: 118.88934326171875
nll mean: 108.70901489257812 	 kl mean: 10.015586853027344 	 loss mean: 118.72460174560547
nll mean: 108.60480499267578 	 kl mean: 10.015586853027344 	 loss mean: 118.62039184570312


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.94it/s][A

nll mean: 125.21040344238281 	 kl mean: 9.90673828125 	 loss mean: 135.1171417236328
nll mean: 125.338623046875 	 kl mean: 9.90673828125 	 loss mean: 135.245361328125
nll mean: 124.82086181640625 	 kl mean: 9.90673828125 	 loss mean: 134.72760009765625


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.94it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 40%|████      | 4/10 [00:00<00:00, 13.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.84it/s][A

nll mean: 125.18153381347656 	 kl mean: 9.90673828125 	 loss mean: 135.08828735351562
nll mean: 125.52982330322266 	 kl mean: 9.90673828125 	 loss mean: 135.43655395507812
nll mean: 125.16300964355469 	 kl mean: 9.90673828125 	 loss mean: 135.06973266601562


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.84it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.90it/s][A

nll mean: 125.38813781738281 	 kl mean: 9.90673828125 	 loss mean: 135.2948760986328
nll mean: 124.91839599609375 	 kl mean: 9.90673828125 	 loss mean: 134.82513427734375
nll mean: 125.27687072753906 	 kl mean: 9.90673828125 	 loss mean: 135.18360900878906


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.90it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.92it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.39it/s][A

nll mean: 125.150146484375 	 kl mean: 9.90673828125 	 loss mean: 135.056884765625
nll mean: 98.80097961425781 	 kl mean: 9.021628379821777 	 loss mean: 107.8226089477539
nll mean: 98.57418823242188 	 kl mean: 9.021628379821777 	 loss mean: 107.5958251953125
nll mean: 98.31462097167969 	 kl mean: 9.021628379821777 	 loss mean: 107.33625793457031
nll mean: 98.15196228027344 	 kl mean: 9.021628379821777 	 loss mean: 107.17359924316406


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.39it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.27it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.34it/s][A

nll mean: 97.8993148803711 	 kl mean: 9.021628379821777 	 loss mean: 106.92094421386719
nll mean: 98.16351318359375 	 kl mean: 9.021628379821777 	 loss mean: 107.18513488769531
nll mean: 98.70965576171875 	 kl mean: 9.021628379821777 	 loss mean: 107.73127746582031
nll mean: 98.58232879638672 	 kl mean: 9.021628379821777 	 loss mean: 107.60395812988281
nll mean: 98.39676666259766 	 kl mean: 9.021628379821777 	 loss mean: 107.41839599609375


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 24.23it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.88it/s][A

nll mean: 98.88446044921875 	 kl mean: 9.021628379821777 	 loss mean: 107.90608215332031
nll mean: 137.94155883789062 	 kl mean: 9.828103065490723 	 loss mean: 147.7696533203125
nll mean: 137.56268310546875 	 kl mean: 9.828103065490723 	 loss mean: 147.39077758789062



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.88it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A

nll mean: 137.3766632080078 	 kl mean: 9.828103065490723 	 loss mean: 147.2047576904297
nll mean: 137.76486206054688 	 kl mean: 9.828103065490723 	 loss mean: 147.59295654296875
nll mean: 137.54852294921875 	 kl mean: 9.828103065490723 	 loss mean: 147.37661743164062



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.88it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.85it/s][A

nll mean: 137.65487670898438 	 kl mean: 9.828103065490723 	 loss mean: 147.48297119140625
nll mean: 137.506103515625 	 kl mean: 9.828103065490723 	 loss mean: 147.33419799804688
nll mean: 137.89773559570312 	 kl mean: 9.828103065490723 	 loss mean: 147.72584533691406



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.82it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]

nll mean: 138.240234375 	 kl mean: 9.828103065490723 	 loss mean: 148.06832885742188
nll mean: 137.73233032226562 	 kl mean: 9.828103065490723 	 loss mean: 147.5604248046875
nll mean: 124.7295913696289 	 kl mean: 9.428552627563477 	 loss mean: 134.15814208984375



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 13.46it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.65it/s][A

nll mean: 124.80935668945312 	 kl mean: 9.428552627563477 	 loss mean: 134.2379150390625
nll mean: 124.54574584960938 	 kl mean: 9.428552627563477 	 loss mean: 133.9742889404297
nll mean: 123.98489379882812 	 kl mean: 9.428552627563477 	 loss mean: 133.4134521484375



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.84it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A

nll mean: 124.06000518798828 	 kl mean: 9.428552627563477 	 loss mean: 133.48854064941406
nll mean: 124.4969482421875 	 kl mean: 9.428552627563477 	 loss mean: 133.92550659179688
nll mean: 124.44426727294922 	 kl mean: 9.428552627563477 	 loss mean: 133.87281799316406



                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.81it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.95it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.55171966552734 	 kl mean: 9.428552627563477 	 loss mean: 133.98025512695312
nll mean: 124.97100830078125 	 kl mean: 9.428552627563477 	 loss mean: 134.39956665039062
nll mean: 124.08776092529297 	 kl mean: 9.428552627563477 	 loss mean: 133.51632690429688



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 122.3511962890625 	 kl mean: 9.341819763183594 	 loss mean: 131.69300842285156
nll mean: 121.49041748046875 	 kl mean: 9.341819763183594 	 loss mean: 130.83224487304688
nll mean: 121.93159484863281 	 kl mean: 9.341819763183594 	 loss mean: 131.27340698242188



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.43it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.22it/s][A

nll mean: 122.15936279296875 	 kl mean: 9.341819763183594 	 loss mean: 131.50119018554688
nll mean: 122.42411041259766 	 kl mean: 9.341819763183594 	 loss mean: 131.76593017578125
nll mean: 122.17146301269531 	 kl mean: 9.341819763183594 	 loss mean: 131.51327514648438



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.17it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 121.71177673339844 	 kl mean: 9.341819763183594 	 loss mean: 131.05360412597656
nll mean: 122.07456970214844 	 kl mean: 9.341819763183594 	 loss mean: 131.4163818359375
nll mean: 122.55001068115234 	 kl mean: 9.341819763183594 	 loss mean: 131.891845703125



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.13it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.19it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 121.951904296875 	 kl mean: 9.341819763183594 	 loss mean: 131.29373168945312
nll mean: 131.59033203125 	 kl mean: 9.268889427185059 	 loss mean: 140.85922241210938
nll mean: 131.5726776123047 	 kl mean: 9.268889427185059 	 loss mean: 140.84156799316406
nll mean: 131.39146423339844 	 kl mean: 9.268889427185059 	 loss mean: 140.6603546142578
nll mean: 131.60256958007812 	 kl mean: 9.268889427185059 	 loss mean: 140.8714599609375



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.95it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.89it/s][A

nll mean: 131.39810180664062 	 kl mean: 9.268889427185059 	 loss mean: 140.6669921875
nll mean: 131.59454345703125 	 kl mean: 9.268889427185059 	 loss mean: 140.86343383789062
nll mean: 131.59523010253906 	 kl mean: 9.268889427185059 	 loss mean: 140.86412048339844
nll mean: 131.16171264648438 	 kl mean: 9.268889427185059 	 loss mean: 140.43060302734375
nll mean: 131.9605712890625 	 kl mean: 9.268889427185059 	 loss mean: 141.22946166992188



                                              
100%|██████████| 10/10 [00:00<00:00, 24.69it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.97it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A

nll mean: 131.33969116210938 	 kl mean: 9.268889427185059 	 loss mean: 140.60858154296875
nll mean: 104.97772216796875 	 kl mean: 9.136292457580566 	 loss mean: 114.11402130126953
nll mean: 104.79998779296875 	 kl mean: 9.136292457580566 	 loss mean: 113.93627166748047
nll mean: 104.64271545410156 	 kl mean: 9.136292457580566 	 loss mean: 113.77900695800781
nll mean: 105.20854187011719 	 kl mean: 9.136292457580566 	 loss mean: 114.3448257446289



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.95it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.81it/s][A

nll mean: 104.4050521850586 	 kl mean: 9.136292457580566 	 loss mean: 113.54133605957031
nll mean: 104.5711669921875 	 kl mean: 9.136292457580566 	 loss mean: 113.70745849609375
nll mean: 104.7191162109375 	 kl mean: 9.136292457580566 	 loss mean: 113.85540771484375
nll mean: 104.3302230834961 	 kl mean: 9.136292457580566 	 loss mean: 113.46650695800781
nll mean: 104.92440795898438 	 kl mean: 9.136292457580566 	 loss mean: 114.06069946289062



                                              
100%|██████████| 10/10 [00:00<00:00, 24.75it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.77it/s][A

nll mean: 104.37004852294922 	 kl mean: 9.136292457580566 	 loss mean: 113.50633239746094
nll mean: 130.4666748046875 	 kl mean: 9.708792686462402 	 loss mean: 140.1754608154297
nll mean: 130.84878540039062 	 kl mean: 9.708792686462402 	 loss mean: 140.55758666992188



                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.62it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.01it/s][A

nll mean: 131.03187561035156 	 kl mean: 9.708792686462402 	 loss mean: 140.7406768798828
nll mean: 130.89462280273438 	 kl mean: 9.708792686462402 	 loss mean: 140.60342407226562
nll mean: 130.42343139648438 	 kl mean: 9.708792686462402 	 loss mean: 140.13223266601562
nll mean: 130.57473754882812 	 kl mean: 9.708792686462402 	 loss mean: 140.28353881835938



                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.99it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 80%|████████  | 8/10 [00:00<00:00, 14.99it/s][A

nll mean: 130.76052856445312 	 kl mean: 9.708792686462402 	 loss mean: 140.4693145751953
nll mean: 130.35964965820312 	 kl mean: 9.708792686462402 	 loss mean: 140.06845092773438
nll mean: 130.68157958984375 	 kl mean: 9.708792686462402 	 loss mean: 140.390380859375
nll mean: 130.31182861328125 	 kl mean: 9.708792686462402 	 loss mean: 140.02061462402344


 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
100%|██████████| 10/10 [00:00<00:00, 14.98it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.99it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A

nll mean: 129.45985412597656 	 kl mean: 9.642881393432617 	 loss mean: 139.10272216796875
nll mean: 129.5396728515625 	 kl mean: 9.642881393432617 	 loss mean: 139.18255615234375
nll mean: 129.342041015625 	 kl mean: 9.642881393432617 	 loss mean: 138.98492431640625
nll mean: 129.3918914794922 	 kl mean: 9.642881393432617 	 loss mean: 139.03475952148438
nll mean: 129.3085174560547 	 kl mean: 9.642881393432617 	 loss mean: 138.951416015625



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.68it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.49it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.24it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 129.43795776367188 	 kl mean: 9.642881393432617 	 loss mean: 139.08084106445312
nll mean: 129.544189453125 	 kl mean: 9.642881393432617 	 loss mean: 139.1870574951172
nll mean: 129.33795166015625 	 kl mean: 9.642881393432617 	 loss mean: 138.98081970214844
nll mean: 129.21136474609375 	 kl mean: 9.642881393432617 	 loss mean: 138.85423278808594
nll mean: 129.40773010253906 	 kl mean: 9.642881393432617 	 loss mean: 139.05062866210938



                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.87it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A

nll mean: 115.82341003417969 	 kl mean: 9.665802001953125 	 loss mean: 125.48921203613281
nll mean: 115.9903335571289 	 kl mean: 9.665802001953125 	 loss mean: 125.65614318847656
nll mean: 115.7706069946289 	 kl mean: 9.665802001953125 	 loss mean: 125.43640899658203
nll mean: 116.07485961914062 	 kl mean: 9.665802001953125 	 loss mean: 125.74066162109375
nll mean: 116.00093841552734 	 kl mean: 9.665802001953125 	 loss mean: 125.666748046875



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.69it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.49it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.27it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 115.90817260742188 	 kl mean: 9.665802001953125 	 loss mean: 125.57396697998047
nll mean: 116.21784973144531 	 kl mean: 9.665802001953125 	 loss mean: 125.8836441040039
nll mean: 115.77783966064453 	 kl mean: 9.665802001953125 	 loss mean: 125.44364166259766
nll mean: 115.75413513183594 	 kl mean: 9.665802001953125 	 loss mean: 125.41993713378906
nll mean: 116.21176147460938 	 kl mean: 9.665802001953125 	 loss mean: 125.87757110595703



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 20.91it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A

nll mean: 140.34707641601562 	 kl mean: 9.595101356506348 	 loss mean: 149.9421844482422
nll mean: 140.34829711914062 	 kl mean: 9.595101356506348 	 loss mean: 149.94338989257812
nll mean: 139.84359741210938 	 kl mean: 9.595101356506348 	 loss mean: 149.43869018554688
nll mean: 140.21421813964844 	 kl mean: 9.595101356506348 	 loss mean: 149.809326171875
nll mean: 140.1124267578125 	 kl mean: 9.595101356506348 	 loss mean: 149.70751953125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.04it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.03it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 20.97it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 140.33876037597656 	 kl mean: 9.595101356506348 	 loss mean: 149.93386840820312
nll mean: 139.7009735107422 	 kl mean: 9.595101356506348 	 loss mean: 149.29608154296875
nll mean: 140.0540771484375 	 kl mean: 9.595101356506348 	 loss mean: 149.649169921875
nll mean: 139.89117431640625 	 kl mean: 9.595101356506348 	 loss mean: 149.4862823486328
nll mean: 140.2691650390625 	 kl mean: 9.595101356506348 	 loss mean: 149.8642578125



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
 20%|██        | 2/10 [00:00<00:00, 12.53it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s][A

nll mean: 118.5006332397461 	 kl mean: 10.021093368530273 	 loss mean: 128.521728515625
nll mean: 118.59867858886719 	 kl mean: 10.021093368530273 	 loss mean: 128.61978149414062
nll mean: 118.50619506835938 	 kl mean: 10.021093368530273 	 loss mean: 128.52728271484375



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.57it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A

nll mean: 118.9243392944336 	 kl mean: 10.021093368530273 	 loss mean: 128.9454345703125
nll mean: 119.3718032836914 	 kl mean: 10.021093368530273 	 loss mean: 129.39288330078125
nll mean: 119.6085433959961 	 kl mean: 10.021093368530273 	 loss mean: 129.629638671875



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.60it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A

nll mean: 118.22523498535156 	 kl mean: 10.021093368530273 	 loss mean: 128.24632263183594
nll mean: 118.7545166015625 	 kl mean: 10.021093368530273 	 loss mean: 128.77561950683594
nll mean: 118.7790298461914 	 kl mean: 10.021093368530273 	 loss mean: 128.8001251220703



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.56it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]


nll mean: 118.47618865966797 	 kl mean: 10.021093368530273 	 loss mean: 128.49728393554688
nll mean: 158.14678955078125 	 kl mean: 10.581856727600098 	 loss mean: 168.7286376953125


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 10.06it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.99it/s][A

nll mean: 158.72817993164062 	 kl mean: 10.581856727600098 	 loss mean: 169.31002807617188
nll mean: 159.21563720703125 	 kl mean: 10.581856727600098 	 loss mean: 169.7974853515625



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.94it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
[A                                           

nll mean: 158.42483520507812 	 kl mean: 10.581856727600098 	 loss mean: 169.0067138671875
nll mean: 159.1554718017578 	 kl mean: 10.581856727600098 	 loss mean: 169.73731994628906


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.90it/s][A
                                              

nll mean: 158.9864501953125 	 kl mean: 10.581856727600098 	 loss mean: 169.56829833984375
nll mean: 159.03302001953125 	 kl mean: 10.581856727600098 	 loss mean: 169.61489868164062


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.92it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.92it/s][A

nll mean: 158.97348022460938 	 kl mean: 10.581856727600098 	 loss mean: 169.55532836914062
nll mean: 158.90264892578125 	 kl mean: 10.581856727600098 	 loss mean: 169.4844970703125



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.53it/s][A

nll mean: 158.38232421875 	 kl mean: 10.581856727600098 	 loss mean: 168.96417236328125
nll mean: 133.17898559570312 	 kl mean: 9.305950164794922 	 loss mean: 142.4849395751953
nll mean: 132.84361267089844 	 kl mean: 9.305950164794922 	 loss mean: 142.14956665039062
nll mean: 133.40245056152344 	 kl mean: 9.305950164794922 	 loss mean: 142.70840454101562


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.53it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.28it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.19it/s][A

nll mean: 133.38543701171875 	 kl mean: 9.305950164794922 	 loss mean: 142.69137573242188
nll mean: 133.3722686767578 	 kl mean: 9.305950164794922 	 loss mean: 142.67820739746094
nll mean: 133.0718994140625 	 kl mean: 9.305950164794922 	 loss mean: 142.3778533935547
nll mean: 133.12045288085938 	 kl mean: 9.305950164794922 	 loss mean: 142.42642211914062


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.19it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.06it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.99it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.234619140625 	 kl mean: 9.305950164794922 	 loss mean: 142.54058837890625
nll mean: 132.6678466796875 	 kl mean: 9.305950164794922 	 loss mean: 141.97381591796875
nll mean: 133.91087341308594 	 kl mean: 9.305950164794922 	 loss mean: 143.21682739257812



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A

nll mean: 141.46600341796875 	 kl mean: 10.098394393920898 	 loss mean: 151.56439208984375
nll mean: 140.8566131591797 	 kl mean: 10.098394393920898 	 loss mean: 150.95498657226562
nll mean: 141.4318389892578 	 kl mean: 10.098394393920898 	 loss mean: 151.53024291992188



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.78it/s][A

nll mean: 140.89089965820312 	 kl mean: 10.098394393920898 	 loss mean: 150.9893035888672
nll mean: 141.7572479248047 	 kl mean: 10.098394393920898 	 loss mean: 151.8556365966797
nll mean: 141.42364501953125 	 kl mean: 10.098394393920898 	 loss mean: 151.5220489501953



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s][A

nll mean: 141.4706268310547 	 kl mean: 10.098394393920898 	 loss mean: 151.56903076171875
nll mean: 140.81802368164062 	 kl mean: 10.098394393920898 	 loss mean: 150.9164276123047
nll mean: 141.3571014404297 	 kl mean: 10.098394393920898 	 loss mean: 151.45547485351562



                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.50it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.74it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.85it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A

nll mean: 140.97032165527344 	 kl mean: 10.098394393920898 	 loss mean: 151.06871032714844
nll mean: 142.71485900878906 	 kl mean: 9.137462615966797 	 loss mean: 151.85232543945312
nll mean: 143.02774047851562 	 kl mean: 9.137462615966797 	 loss mean: 152.1652069091797
nll mean: 142.92489624023438 	 kl mean: 9.137462615966797 	 loss mean: 152.06234741210938
nll mean: 142.82730102539062 	 kl mean: 9.137462615966797 	 loss mean: 151.96475219726562



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.65it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.58it/s][A

nll mean: 142.79833984375 	 kl mean: 9.137462615966797 	 loss mean: 151.935791015625
nll mean: 142.5211181640625 	 kl mean: 9.137462615966797 	 loss mean: 151.65858459472656
nll mean: 142.75643920898438 	 kl mean: 9.137462615966797 	 loss mean: 151.89390563964844
nll mean: 142.9083709716797 	 kl mean: 9.137462615966797 	 loss mean: 152.0458221435547
nll mean: 142.51939392089844 	 kl mean: 9.137462615966797 	 loss mean: 151.65684509277344



                                               
100%|██████████| 10/10 [00:00<00:00, 24.35it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.42it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A

nll mean: 142.78973388671875 	 kl mean: 9.137462615966797 	 loss mean: 151.9272003173828
nll mean: 131.69961547851562 	 kl mean: 9.54057502746582 	 loss mean: 141.24017333984375
nll mean: 132.27029418945312 	 kl mean: 9.54057502746582 	 loss mean: 141.81085205078125
nll mean: 132.03712463378906 	 kl mean: 9.54057502746582 	 loss mean: 141.57769775390625
nll mean: 132.24879455566406 	 kl mean: 9.54057502746582 	 loss mean: 141.78936767578125



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.49it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.46it/s][A

nll mean: 132.35452270507812 	 kl mean: 9.54057502746582 	 loss mean: 141.8950958251953
nll mean: 132.24374389648438 	 kl mean: 9.54057502746582 	 loss mean: 141.7843017578125
nll mean: 132.1547393798828 	 kl mean: 9.54057502746582 	 loss mean: 141.6953125
nll mean: 132.19049072265625 	 kl mean: 9.54057502746582 	 loss mean: 141.7310791015625
nll mean: 132.33494567871094 	 kl mean: 9.54057502746582 	 loss mean: 141.87551879882812



                                               
100%|██████████| 10/10 [00:00<00:00, 24.45it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A

nll mean: 132.65139770507812 	 kl mean: 9.54057502746582 	 loss mean: 142.19198608398438
nll mean: 126.67768859863281 	 kl mean: 10.357614517211914 	 loss mean: 137.03530883789062
nll mean: 126.67211151123047 	 kl mean: 10.357614517211914 	 loss mean: 137.02972412109375



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A

nll mean: 127.43891906738281 	 kl mean: 10.357614517211914 	 loss mean: 137.79652404785156
nll mean: 127.10637664794922 	 kl mean: 10.357614517211914 	 loss mean: 137.4639892578125
nll mean: 126.90035247802734 	 kl mean: 10.357614517211914 	 loss mean: 137.25796508789062



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.62it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 127.09549713134766 	 kl mean: 10.357614517211914 	 loss mean: 137.453125
nll mean: 127.1681137084961 	 kl mean: 10.357614517211914 	 loss mean: 137.52572631835938
nll mean: 126.80537414550781 	 kl mean: 10.357614517211914 	 loss mean: 137.16299438476562



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]

nll mean: 127.00575256347656 	 kl mean: 10.357614517211914 	 loss mean: 137.36337280273438
nll mean: 127.59762573242188 	 kl mean: 10.357614517211914 	 loss mean: 137.95523071289062
nll mean: 146.32049560546875 	 kl mean: 9.892324447631836 	 loss mean: 156.2128143310547



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.58it/s][A

nll mean: 146.222900390625 	 kl mean: 9.892324447631836 	 loss mean: 156.115234375
nll mean: 146.4161376953125 	 kl mean: 9.892324447631836 	 loss mean: 156.30845642089844
nll mean: 146.2470245361328 	 kl mean: 9.892324447631836 	 loss mean: 156.13934326171875



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A

nll mean: 146.42617797851562 	 kl mean: 9.892324447631836 	 loss mean: 156.3184814453125
nll mean: 146.18653869628906 	 kl mean: 9.892324447631836 	 loss mean: 156.078857421875
nll mean: 146.3623046875 	 kl mean: 9.892324447631836 	 loss mean: 156.25462341308594



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 146.63485717773438 	 kl mean: 9.892324447631836 	 loss mean: 156.5271759033203
nll mean: 146.2630615234375 	 kl mean: 9.892324447631836 	 loss mean: 156.1553955078125
nll mean: 146.37265014648438 	 kl mean: 9.892324447631836 	 loss mean: 156.26498413085938



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A

nll mean: 154.33030700683594 	 kl mean: 9.393508911132812 	 loss mean: 163.72381591796875
nll mean: 154.3751983642578 	 kl mean: 9.393508911132812 	 loss mean: 163.76870727539062
nll mean: 154.21377563476562 	 kl mean: 9.393508911132812 	 loss mean: 163.60728454589844



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.59it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.62it/s][A

nll mean: 153.938232421875 	 kl mean: 9.393508911132812 	 loss mean: 163.33172607421875
nll mean: 154.27850341796875 	 kl mean: 9.393508911132812 	 loss mean: 163.67202758789062
nll mean: 154.8546142578125 	 kl mean: 9.393508911132812 	 loss mean: 164.24813842773438



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.68it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A

nll mean: 154.82321166992188 	 kl mean: 9.393508911132812 	 loss mean: 164.21670532226562
nll mean: 154.32321166992188 	 kl mean: 9.393508911132812 	 loss mean: 163.7167205810547
nll mean: 154.3795928955078 	 kl mean: 9.393508911132812 	 loss mean: 163.77310180664062



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.68it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.40it/s][A

nll mean: 154.32620239257812 	 kl mean: 9.393508911132812 	 loss mean: 163.71971130371094
nll mean: 116.51937866210938 	 kl mean: 9.537884712219238 	 loss mean: 126.05726623535156
nll mean: 116.9572982788086 	 kl mean: 9.537884712219238 	 loss mean: 126.49518585205078



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.36it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A

nll mean: 116.89325714111328 	 kl mean: 9.537884712219238 	 loss mean: 126.43113708496094
nll mean: 115.9775390625 	 kl mean: 9.537884712219238 	 loss mean: 125.51542663574219
nll mean: 116.81324768066406 	 kl mean: 9.537884712219238 	 loss mean: 126.35113525390625



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.36it/s][A

nll mean: 116.54045867919922 	 kl mean: 9.537884712219238 	 loss mean: 126.0783462524414
nll mean: 116.82041931152344 	 kl mean: 9.537884712219238 	 loss mean: 126.3582992553711
nll mean: 116.77489471435547 	 kl mean: 9.537884712219238 	 loss mean: 126.31278228759766



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.34it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.17396545410156 	 kl mean: 9.537884712219238 	 loss mean: 125.71184539794922
nll mean: 116.09590148925781 	 kl mean: 9.537884712219238 	 loss mean: 125.6337890625
nll mean: 104.92343139648438 	 kl mean: 8.496099472045898 	 loss mean: 113.41952514648438
nll mean: 105.1090087890625 	 kl mean: 8.496099472045898 	 loss mean: 113.60511016845703
nll mean: 105.40284729003906 	 kl mean: 8.496099472045898 	 loss mean: 113.89894104003906


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
 40%|████      | 4/10 [00:00<00:00, 33.37it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.26it/s]
100%|██████████| 10/10 [00:00<00:00, 31.98it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.20724487304688 	 kl mean: 8.496099472045898 	 loss mean: 113.70333862304688
nll mean: 105.65603637695312 	 kl mean: 8.496099472045898 	 loss mean: 114.15213775634766
nll mean: 105.75180053710938 	 kl mean: 8.496099472045898 	 loss mean: 114.2479019165039
nll mean: 105.2650146484375 	 kl mean: 8.496099472045898 	 loss mean: 113.76111602783203
nll mean: 105.27134704589844 	 kl mean: 8.496099472045898 	 loss mean: 113.76744079589844
nll mean: 104.59843444824219 	 kl mean: 8.496099472045898 	 loss mean: 113.09453582763672
nll mean: 105.38395690917969 	 kl mean: 8.496099472045898 	 loss mean: 113.88004302978516


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.12it/s][A

nll mean: 155.30429077148438 	 kl mean: 9.543601989746094 	 loss mean: 164.847900390625
nll mean: 154.7250518798828 	 kl mean: 9.543601989746094 	 loss mean: 164.26864624023438
nll mean: 155.35189819335938 	 kl mean: 9.543601989746094 	 loss mean: 164.89549255371094


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.12it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.17it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.21it/s][A

nll mean: 155.795166015625 	 kl mean: 9.543601989746094 	 loss mean: 165.33877563476562
nll mean: 155.2663116455078 	 kl mean: 9.543601989746094 	 loss mean: 164.80990600585938
nll mean: 155.23153686523438 	 kl mean: 9.543601989746094 	 loss mean: 164.775146484375


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.21it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.26it/s][A

nll mean: 155.49465942382812 	 kl mean: 9.543601989746094 	 loss mean: 165.0382537841797
nll mean: 154.8359375 	 kl mean: 9.543601989746094 	 loss mean: 164.37954711914062
nll mean: 154.53604125976562 	 kl mean: 9.543601989746094 	 loss mean: 164.07965087890625


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.26it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.26it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.24it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A

nll mean: 154.72760009765625 	 kl mean: 9.543601989746094 	 loss mean: 164.27120971679688
nll mean: 119.26835632324219 	 kl mean: 10.523256301879883 	 loss mean: 129.79161071777344
nll mean: 119.6546630859375 	 kl mean: 10.523256301879883 	 loss mean: 130.17791748046875
nll mean: 119.40155029296875 	 kl mean: 10.523256301879883 	 loss mean: 129.9248046875
nll mean: 119.42083740234375 	 kl mean: 10.523256301879883 	 loss mean: 129.944091796875



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.11it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.16it/s][A

nll mean: 119.68814849853516 	 kl mean: 10.523256301879883 	 loss mean: 130.21141052246094
nll mean: 119.19099426269531 	 kl mean: 10.523256301879883 	 loss mean: 129.71424865722656
nll mean: 119.88057708740234 	 kl mean: 10.523256301879883 	 loss mean: 130.40383911132812
nll mean: 119.67247009277344 	 kl mean: 10.523256301879883 	 loss mean: 130.19573974609375
nll mean: 119.63701629638672 	 kl mean: 10.523256301879883 	 loss mean: 130.1602783203125



                                               
100%|██████████| 10/10 [00:00<00:00, 21.17it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.66it/s][A

nll mean: 119.33973693847656 	 kl mean: 10.523256301879883 	 loss mean: 129.86297607421875
nll mean: 113.5257568359375 	 kl mean: 9.527853965759277 	 loss mean: 123.0536117553711
nll mean: 113.68254089355469 	 kl mean: 9.527853965759277 	 loss mean: 123.21038818359375



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A

nll mean: 113.69994354248047 	 kl mean: 9.527853965759277 	 loss mean: 123.22779083251953
nll mean: 113.61248779296875 	 kl mean: 9.527853965759277 	 loss mean: 123.14034271240234
nll mean: 113.70731353759766 	 kl mean: 9.527853965759277 	 loss mean: 123.23516082763672



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.73it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.74it/s][A
                                               

nll mean: 114.00094604492188 	 kl mean: 9.527853965759277 	 loss mean: 123.52880096435547
nll mean: 113.54299926757812 	 kl mean: 9.527853965759277 	 loss mean: 123.07084655761719
nll mean: 113.48114776611328 	 kl mean: 9.527853965759277 	 loss mean: 123.00900268554688



 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.78it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 23.23it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 113.54331970214844 	 kl mean: 9.527853965759277 	 loss mean: 123.07117462158203
nll mean: 114.41228485107422 	 kl mean: 9.527853965759277 	 loss mean: 123.94013977050781
nll mean: 80.666259765625 	 kl mean: 8.345170974731445 	 loss mean: 89.01143646240234
nll mean: 80.52809143066406 	 kl mean: 8.345170974731445 	 loss mean: 88.8732681274414
nll mean: 80.60945129394531 	 kl mean: 8.345170974731445 	 loss mean: 88.95462799072266
nll mean: 80.30508422851562 	 kl mean: 8.345170974731445 	 loss mean: 88.65025329589844



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.72it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.40it/s][A

nll mean: 80.6863021850586 	 kl mean: 8.345170974731445 	 loss mean: 89.03146362304688
nll mean: 80.25353240966797 	 kl mean: 8.345170974731445 	 loss mean: 88.59870910644531
nll mean: 81.13004302978516 	 kl mean: 8.345170974731445 	 loss mean: 89.4752197265625
nll mean: 81.15940856933594 	 kl mean: 8.345170974731445 	 loss mean: 89.50458526611328
nll mean: 80.60806274414062 	 kl mean: 8.345170974731445 	 loss mean: 88.95323181152344



                                               
100%|██████████| 10/10 [00:00<00:00, 22.18it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 22.23it/s][A

nll mean: 80.9041976928711 	 kl mean: 8.345170974731445 	 loss mean: 89.2493667602539
nll mean: 107.01338195800781 	 kl mean: 8.44442081451416 	 loss mean: 115.45779418945312
nll mean: 107.33078002929688 	 kl mean: 8.44442081451416 	 loss mean: 115.77519226074219
nll mean: 106.69654846191406 	 kl mean: 8.44442081451416 	 loss mean: 115.14097595214844
nll mean: 107.42451477050781 	 kl mean: 8.44442081451416 	 loss mean: 115.86893463134766


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 22.23it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.03it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.90it/s][A

nll mean: 106.96485900878906 	 kl mean: 8.44442081451416 	 loss mean: 115.40927124023438
nll mean: 107.1502685546875 	 kl mean: 8.44442081451416 	 loss mean: 115.59469604492188
nll mean: 106.99435424804688 	 kl mean: 8.44442081451416 	 loss mean: 115.43878173828125
nll mean: 107.52796173095703 	 kl mean: 8.44442081451416 	 loss mean: 115.97238159179688
nll mean: 107.01426696777344 	 kl mean: 8.44442081451416 	 loss mean: 115.45869445800781


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.79it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.37it/s][A

nll mean: 106.89672088623047 	 kl mean: 8.44442081451416 	 loss mean: 115.34114074707031
nll mean: 118.72886657714844 	 kl mean: 9.734465599060059 	 loss mean: 128.4633331298828
nll mean: 119.08462524414062 	 kl mean: 9.734465599060059 	 loss mean: 128.819091796875



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.47it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 118.4395980834961 	 kl mean: 9.734465599060059 	 loss mean: 128.174072265625
nll mean: 118.76409912109375 	 kl mean: 9.734465599060059 	 loss mean: 128.49856567382812
nll mean: 118.90187072753906 	 kl mean: 9.734465599060059 	 loss mean: 128.63633728027344



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.55it/s][A

nll mean: 118.46602630615234 	 kl mean: 9.734465599060059 	 loss mean: 128.2004852294922
nll mean: 118.95851135253906 	 kl mean: 9.734465599060059 	 loss mean: 128.69297790527344
nll mean: 118.36546325683594 	 kl mean: 9.734465599060059 	 loss mean: 128.0999298095703



                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.50it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.68363189697266 	 kl mean: 9.734465599060059 	 loss mean: 128.4180908203125
nll mean: 118.69692993164062 	 kl mean: 9.734465599060059 	 loss mean: 128.431396484375
nll mean: 59.98345947265625 	 kl mean: 9.962936401367188 	 loss mean: 69.94639587402344


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.25it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.21it/s]

nll mean: 59.17311477661133 	 kl mean: 9.962936401367188 	 loss mean: 69.13604736328125
nll mean: 59.811927795410156 	 kl mean: 9.962936401367188 	 loss mean: 69.77485656738281
nll mean: 59.92588424682617 	 kl mean: 9.962936401367188 	 loss mean: 69.88882446289062


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 10.21it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.22it/s][A

nll mean: 60.40302658081055 	 kl mean: 9.962936401367188 	 loss mean: 70.365966796875
nll mean: 60.48198318481445 	 kl mean: 9.962936401367188 	 loss mean: 70.4449234008789
nll mean: 59.955284118652344 	 kl mean: 9.962936401367188 	 loss mean: 69.918212890625


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.22it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.20it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.19it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s]

nll mean: 59.76768112182617 	 kl mean: 9.962936401367188 	 loss mean: 69.73062133789062
nll mean: 60.3194465637207 	 kl mean: 9.962936401367188 	 loss mean: 70.28238677978516
nll mean: 60.33048629760742 	 kl mean: 9.962936401367188 	 loss mean: 70.29341888427734


[A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.10it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A

nll mean: 104.18341064453125 	 kl mean: 9.295320510864258 	 loss mean: 113.47872924804688
nll mean: 103.7873306274414 	 kl mean: 9.295320510864258 	 loss mean: 113.08264923095703
nll mean: 103.8519287109375 	 kl mean: 9.295320510864258 	 loss mean: 113.14726257324219



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.00it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.90it/s][A

nll mean: 103.48273468017578 	 kl mean: 9.295320510864258 	 loss mean: 112.77806091308594
nll mean: 104.3616714477539 	 kl mean: 9.295320510864258 	 loss mean: 113.656982421875
nll mean: 103.91364288330078 	 kl mean: 9.295320510864258 	 loss mean: 113.2089614868164



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.74it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A

nll mean: 103.67286682128906 	 kl mean: 9.295320510864258 	 loss mean: 112.96818542480469
nll mean: 103.20098876953125 	 kl mean: 9.295320510864258 	 loss mean: 112.49630737304688
nll mean: 103.37184143066406 	 kl mean: 9.295320510864258 	 loss mean: 112.66716003417969



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.59it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 10%|█         | 1/10 [00:00<00:00,  9.87it/s][A

nll mean: 103.48440551757812 	 kl mean: 9.295320510864258 	 loss mean: 112.77972412109375
nll mean: 136.78150939941406 	 kl mean: 10.33951473236084 	 loss mean: 147.12103271484375



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.87it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.83it/s][A

nll mean: 135.99171447753906 	 kl mean: 10.33951473236084 	 loss mean: 146.3312225341797
nll mean: 136.79421997070312 	 kl mean: 10.33951473236084 	 loss mean: 147.1337432861328



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.85it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.80it/s][A

nll mean: 136.30325317382812 	 kl mean: 10.33951473236084 	 loss mean: 146.6427764892578
nll mean: 136.55203247070312 	 kl mean: 10.33951473236084 	 loss mean: 146.89154052734375



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.84it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
                                               

nll mean: 136.9752197265625 	 kl mean: 10.33951473236084 	 loss mean: 147.31472778320312
nll mean: 136.56326293945312 	 kl mean: 10.33951473236084 	 loss mean: 146.90277099609375



 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.91it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
[A                                           

nll mean: 136.36334228515625 	 kl mean: 10.33951473236084 	 loss mean: 146.70285034179688
nll mean: 136.53152465820312 	 kl mean: 10.33951473236084 	 loss mean: 146.87103271484375


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.88it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.55it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A

nll mean: 136.92047119140625 	 kl mean: 10.33951473236084 	 loss mean: 147.25997924804688
nll mean: 63.03227996826172 	 kl mean: 9.045076370239258 	 loss mean: 72.07736206054688
nll mean: 63.573875427246094 	 kl mean: 9.045076370239258 	 loss mean: 72.61895751953125
nll mean: 63.14482879638672 	 kl mean: 9.045076370239258 	 loss mean: 72.18991088867188
nll mean: 62.56034851074219 	 kl mean: 9.045076370239258 	 loss mean: 71.60543060302734
nll mean: 63.528907775878906 	 kl mean: 9.045076370239258 	 loss mean: 72.57398223876953



                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 60%|██████    | 6/10 [00:00<00:00, 26.24it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 26.01it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.64it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 63.42680358886719 	 kl mean: 9.045076370239258 	 loss mean: 72.47187805175781
nll mean: 62.974853515625 	 kl mean: 9.045076370239258 	 loss mean: 72.01992797851562
nll mean: 63.438602447509766 	 kl mean: 9.045076370239258 	 loss mean: 72.48367309570312
nll mean: 63.08757400512695 	 kl mean: 9.045076370239258 	 loss mean: 72.13264465332031
nll mean: 63.59669876098633 	 kl mean: 9.045076370239258 	 loss mean: 72.64176940917969


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.64it/s][A

nll mean: 116.9849624633789 	 kl mean: 8.958353996276855 	 loss mean: 125.94332885742188
nll mean: 117.03694152832031 	 kl mean: 8.958353996276855 	 loss mean: 125.99529266357422
nll mean: 117.34500122070312 	 kl mean: 8.958353996276855 	 loss mean: 126.30335998535156
nll mean: 117.09866333007812 	 kl mean: 8.958353996276855 	 loss mean: 126.05701446533203
nll mean: 116.67823028564453 	 kl mean: 8.958353996276855 	 loss mean: 125.63658905029297


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.64it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.62it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.54it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.56356811523438 	 kl mean: 8.958353996276855 	 loss mean: 126.52192687988281
nll mean: 117.05781555175781 	 kl mean: 8.958353996276855 	 loss mean: 126.01618194580078
nll mean: 117.07550048828125 	 kl mean: 8.958353996276855 	 loss mean: 126.03385925292969
nll mean: 117.07902526855469 	 kl mean: 8.958353996276855 	 loss mean: 126.0373764038086
nll mean: 116.90451049804688 	 kl mean: 8.958353996276855 	 loss mean: 125.86286926269531


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.29it/s][A

nll mean: 117.92453002929688 	 kl mean: 9.656072616577148 	 loss mean: 127.58060455322266
nll mean: 118.15704345703125 	 kl mean: 9.656072616577148 	 loss mean: 127.81311798095703
nll mean: 118.16273498535156 	 kl mean: 9.656072616577148 	 loss mean: 127.81880187988281


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.29it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 12.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A

nll mean: 118.2777099609375 	 kl mean: 9.656072616577148 	 loss mean: 127.93377685546875
nll mean: 118.55281066894531 	 kl mean: 9.656072616577148 	 loss mean: 128.20889282226562
nll mean: 117.52486419677734 	 kl mean: 9.656072616577148 	 loss mean: 127.18093872070312


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A

nll mean: 118.28264617919922 	 kl mean: 9.656072616577148 	 loss mean: 127.93872833251953
nll mean: 118.098876953125 	 kl mean: 9.656072616577148 	 loss mean: 127.75495910644531
nll mean: 117.97535705566406 	 kl mean: 9.656072616577148 	 loss mean: 127.63143920898438


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.65it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.71it/s][A

nll mean: 117.90491485595703 	 kl mean: 9.656072616577148 	 loss mean: 127.56098175048828
nll mean: 111.87203979492188 	 kl mean: 9.125237464904785 	 loss mean: 120.99728393554688
nll mean: 111.60507202148438 	 kl mean: 9.125237464904785 	 loss mean: 120.73030853271484


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.71it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A

nll mean: 112.02450561523438 	 kl mean: 9.125237464904785 	 loss mean: 121.14973449707031
nll mean: 112.32395935058594 	 kl mean: 9.125237464904785 	 loss mean: 121.44920349121094
nll mean: 111.98187255859375 	 kl mean: 9.125237464904785 	 loss mean: 121.10710144042969


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.70it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A

nll mean: 111.6219711303711 	 kl mean: 9.125237464904785 	 loss mean: 120.74720764160156
nll mean: 111.72772216796875 	 kl mean: 9.125237464904785 	 loss mean: 120.85295104980469
nll mean: 112.12606811523438 	 kl mean: 9.125237464904785 	 loss mean: 121.25130462646484


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.69it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.67it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]

nll mean: 111.77591705322266 	 kl mean: 9.125237464904785 	 loss mean: 120.90115356445312
nll mean: 111.38533020019531 	 kl mean: 9.125237464904785 	 loss mean: 120.51057434082031
nll mean: 110.39616394042969 	 kl mean: 9.282805442810059 	 loss mean: 119.67897033691406
nll mean: 110.03518676757812 	 kl mean: 9.282805442810059 	 loss mean: 119.3179931640625



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 22.96it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.23it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A

nll mean: 110.41075897216797 	 kl mean: 9.282805442810059 	 loss mean: 119.69356536865234
nll mean: 110.09687042236328 	 kl mean: 9.282805442810059 	 loss mean: 119.37967681884766
nll mean: 111.09767150878906 	 kl mean: 9.282805442810059 	 loss mean: 120.38046264648438
nll mean: 110.8721923828125 	 kl mean: 9.282805442810059 	 loss mean: 120.15499877929688
nll mean: 110.64645385742188 	 kl mean: 9.282805442810059 	 loss mean: 119.92926025390625



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.97it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.41it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               


nll mean: 110.35111236572266 	 kl mean: 9.282805442810059 	 loss mean: 119.63391876220703
nll mean: 110.41877746582031 	 kl mean: 9.282805442810059 	 loss mean: 119.70158386230469
nll mean: 111.06343841552734 	 kl mean: 9.282805442810059 	 loss mean: 120.34623718261719
nll mean: 85.03831481933594 	 kl mean: 9.71517562866211 	 loss mean: 94.75349426269531
nll mean: 84.28899383544922 	 kl mean: 9.71517562866211 	 loss mean: 94.0041732788086


 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.80it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 30.68it/s][A

nll mean: 85.03936767578125 	 kl mean: 9.71517562866211 	 loss mean: 94.7545394897461
nll mean: 84.77288818359375 	 kl mean: 9.71517562866211 	 loss mean: 94.48806762695312
nll mean: 84.54942321777344 	 kl mean: 9.71517562866211 	 loss mean: 94.26458740234375
nll mean: 85.45037078857422 	 kl mean: 9.71517562866211 	 loss mean: 95.16554260253906
nll mean: 84.13719940185547 	 kl mean: 9.71517562866211 	 loss mean: 93.85237884521484
nll mean: 84.95956420898438 	 kl mean: 9.71517562866211 	 loss mean: 94.67472839355469
nll mean: 84.68633270263672 	 kl mean: 9.71517562866211 	 loss mean: 94.4015121459961


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
100%|██████████| 10/10 [00:00<00:00, 30.48it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 84.92535400390625 	 kl mean: 9.71517562866211 	 loss mean: 94.6405258178711
Approximate NLL:
tensor(119.8687, device='cuda:0')
Approximate KL:
tensor(9.5362, device='cuda:0')
Testing took 0:00:25.287751


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 25.50it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].50it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].50it/s][A
[A                                           

nll mean: 108.76423645019531 	 kl mean: 10.458614349365234 	 loss mean: 119.22285461425781
nll mean: 108.60208129882812 	 kl mean: 10.458614349365234 	 loss mean: 119.06069946289062
nll mean: 109.0098876953125 	 kl mean: 10.458614349365234 	 loss mean: 119.468505859375
nll mean: 108.74803161621094 	 kl mean: 10.458614349365234 	 loss mean: 119.20664978027344
nll mean: 108.8069839477539 	 kl mean: 10.458614349365234 	 loss mean: 119.26559448242188


                                      
  0%|          | 0/38 [00:00<?, ?it/s].50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.36it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].36it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].36it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].36it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.75it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 24.62it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.00020599365234 	 kl mean: 10.458614349365234 	 loss mean: 119.45882415771484
nll mean: 108.26731872558594 	 kl mean: 10.458614349365234 	 loss mean: 118.7259292602539
nll mean: 109.20751953125 	 kl mean: 10.458614349365234 	 loss mean: 119.6661376953125
nll mean: 108.84512329101562 	 kl mean: 10.458614349365234 	 loss mean: 119.30374145507812
nll mean: 109.11785888671875 	 kl mean: 10.458614349365234 	 loss mean: 119.57646942138672


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 20%|██        | 2/10 [00:00<00:00, 13.74it/s][A

nll mean: 125.1038818359375 	 kl mean: 9.974714279174805 	 loss mean: 135.07858276367188
nll mean: 124.67599487304688 	 kl mean: 9.974714279174805 	 loss mean: 134.65069580078125
nll mean: 124.2425308227539 	 kl mean: 9.974714279174805 	 loss mean: 134.21725463867188


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 20%|██        | 2/10 [00:00<00:00, 13.74it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 40%|████      | 4/10 [00:00<00:00, 13.86it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.94it/s][A

nll mean: 124.85159301757812 	 kl mean: 9.974714279174805 	 loss mean: 134.82630920410156
nll mean: 125.28033447265625 	 kl mean: 9.974714279174805 	 loss mean: 135.25506591796875
nll mean: 124.58969116210938 	 kl mean: 9.974714279174805 	 loss mean: 134.5644073486328


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.94it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.96it/s][A

nll mean: 125.02169799804688 	 kl mean: 9.974714279174805 	 loss mean: 134.99642944335938
nll mean: 125.57782745361328 	 kl mean: 9.974714279174805 	 loss mean: 135.5525360107422
nll mean: 124.43756103515625 	 kl mean: 9.974714279174805 	 loss mean: 134.41226196289062


                                              
  3%|▎         | 1/38 [00:01<00:15,  2.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.96it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.04it/s][A
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s]
 30%|███       | 3/10 [00:00<00:00, 25.34it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A

nll mean: 125.22669982910156 	 kl mean: 9.974714279174805 	 loss mean: 135.201416015625
nll mean: 97.93878173828125 	 kl mean: 9.363335609436035 	 loss mean: 107.30210876464844
nll mean: 97.79881286621094 	 kl mean: 9.363335609436035 	 loss mean: 107.16214752197266
nll mean: 97.10025024414062 	 kl mean: 9.363335609436035 	 loss mean: 106.46358489990234
nll mean: 97.88095092773438 	 kl mean: 9.363335609436035 	 loss mean: 107.2442855834961



                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.73it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:18,  2.00it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.47it/s][A

nll mean: 97.84135437011719 	 kl mean: 9.363335609436035 	 loss mean: 107.20469665527344
nll mean: 97.216796875 	 kl mean: 9.363335609436035 	 loss mean: 106.58013916015625
nll mean: 96.97848510742188 	 kl mean: 9.363335609436035 	 loss mean: 106.3418197631836
nll mean: 97.80195617675781 	 kl mean: 9.363335609436035 	 loss mean: 107.16529846191406
nll mean: 97.18537902832031 	 kl mean: 9.363335609436035 	 loss mean: 106.5487060546875



                                              
100%|██████████| 10/10 [00:00<00:00, 24.25it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
 20%|██        | 2/10 [00:00<00:00, 10.80it/s][A

nll mean: 97.35164642333984 	 kl mean: 9.363335609436035 	 loss mean: 106.71498107910156
nll mean: 137.05078125 	 kl mean: 9.480364799499512 	 loss mean: 146.53115844726562
nll mean: 137.79637145996094 	 kl mean: 9.480364799499512 	 loss mean: 147.2767333984375



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.80it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A

nll mean: 137.77297973632812 	 kl mean: 9.480364799499512 	 loss mean: 147.2533416748047
nll mean: 137.5648956298828 	 kl mean: 9.480364799499512 	 loss mean: 147.04525756835938
nll mean: 137.376708984375 	 kl mean: 9.480364799499512 	 loss mean: 146.85708618164062



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.79it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A

nll mean: 137.6040802001953 	 kl mean: 9.480364799499512 	 loss mean: 147.08444213867188
nll mean: 137.25352478027344 	 kl mean: 9.480364799499512 	 loss mean: 146.73388671875
nll mean: 137.90216064453125 	 kl mean: 9.480364799499512 	 loss mean: 147.3825225830078



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.75it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.6167755126953 	 kl mean: 9.480364799499512 	 loss mean: 147.09713745117188
nll mean: 137.57281494140625 	 kl mean: 9.480364799499512 	 loss mean: 147.05319213867188
nll mean: 125.33926391601562 	 kl mean: 9.31458854675293 	 loss mean: 134.65386962890625


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.48it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A

nll mean: 124.29898071289062 	 kl mean: 9.31458854675293 	 loss mean: 133.6135711669922
nll mean: 124.73880004882812 	 kl mean: 9.31458854675293 	 loss mean: 134.0533905029297
nll mean: 124.787841796875 	 kl mean: 9.31458854675293 	 loss mean: 134.10243225097656


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.44it/s][A

nll mean: 124.36138153076172 	 kl mean: 9.31458854675293 	 loss mean: 133.67596435546875
nll mean: 124.80033874511719 	 kl mean: 9.31458854675293 	 loss mean: 134.11492919921875
nll mean: 125.19876861572266 	 kl mean: 9.31458854675293 	 loss mean: 134.51336669921875


                                              
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.44it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.39it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 124.80349731445312 	 kl mean: 9.31458854675293 	 loss mean: 134.1180877685547
nll mean: 124.97030639648438 	 kl mean: 9.31458854675293 	 loss mean: 134.28488159179688
nll mean: 125.08672332763672 	 kl mean: 9.31458854675293 	 loss mean: 134.40130615234375



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.25it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A

nll mean: 122.96159362792969 	 kl mean: 9.525859832763672 	 loss mean: 132.48745727539062
nll mean: 122.8905029296875 	 kl mean: 9.525859832763672 	 loss mean: 132.41636657714844
nll mean: 122.679443359375 	 kl mean: 9.525859832763672 	 loss mean: 132.20529174804688



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.18it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.22it/s][A

nll mean: 123.05008697509766 	 kl mean: 9.525859832763672 	 loss mean: 132.57595825195312
nll mean: 122.80705261230469 	 kl mean: 9.525859832763672 	 loss mean: 132.33290100097656
nll mean: 122.67213439941406 	 kl mean: 9.525859832763672 	 loss mean: 132.197998046875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.28it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A

nll mean: 123.65716552734375 	 kl mean: 9.525859832763672 	 loss mean: 133.18304443359375
nll mean: 123.15463256835938 	 kl mean: 9.525859832763672 	 loss mean: 132.68051147460938
nll mean: 123.26992797851562 	 kl mean: 9.525859832763672 	 loss mean: 132.79579162597656



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.12it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.21it/s][A

nll mean: 123.41880798339844 	 kl mean: 9.525859832763672 	 loss mean: 132.94467163085938
nll mean: 131.14073181152344 	 kl mean: 9.666733741760254 	 loss mean: 140.80746459960938
nll mean: 132.20407104492188 	 kl mean: 9.666733741760254 	 loss mean: 141.87081909179688
nll mean: 131.61207580566406 	 kl mean: 9.666733741760254 	 loss mean: 141.27880859375
nll mean: 131.67396545410156 	 kl mean: 9.666733741760254 	 loss mean: 141.3406982421875


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 25.21it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.04it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.00it/s][A

nll mean: 131.69140625 	 kl mean: 9.666733741760254 	 loss mean: 141.35813903808594
nll mean: 131.92706298828125 	 kl mean: 9.666733741760254 	 loss mean: 141.59381103515625
nll mean: 131.6800537109375 	 kl mean: 9.666733741760254 	 loss mean: 141.3468017578125
nll mean: 131.5045166015625 	 kl mean: 9.666733741760254 	 loss mean: 141.1712646484375
nll mean: 131.08090209960938 	 kl mean: 9.666733741760254 	 loss mean: 140.7476348876953


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 24.87it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 25.19it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A

nll mean: 131.32687377929688 	 kl mean: 9.666733741760254 	 loss mean: 140.99362182617188
nll mean: 104.52268981933594 	 kl mean: 9.326852798461914 	 loss mean: 113.84953308105469
nll mean: 104.01787567138672 	 kl mean: 9.326852798461914 	 loss mean: 113.34473419189453
nll mean: 104.3155517578125 	 kl mean: 9.326852798461914 	 loss mean: 113.64240264892578
nll mean: 104.83892822265625 	 kl mean: 9.326852798461914 	 loss mean: 114.16577911376953



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.06it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.72it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.00it/s][A


nll mean: 104.37602233886719 	 kl mean: 9.326852798461914 	 loss mean: 113.702880859375
nll mean: 104.386474609375 	 kl mean: 9.326852798461914 	 loss mean: 113.71332550048828
nll mean: 104.13363647460938 	 kl mean: 9.326852798461914 	 loss mean: 113.46048736572266
nll mean: 104.21078491210938 	 kl mean: 9.326852798461914 	 loss mean: 113.53764343261719
nll mean: 104.06463623046875 	 kl mean: 9.326852798461914 	 loss mean: 113.3914794921875


                                              
100%|██████████| 10/10 [00:00<00:00, 24.90it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s]
 20%|██        | 2/10 [00:00<00:00, 15.34it/s][A

nll mean: 104.43276977539062 	 kl mean: 9.326852798461914 	 loss mean: 113.7596206665039
nll mean: 129.85336303710938 	 kl mean: 10.088837623596191 	 loss mean: 139.94219970703125
nll mean: 129.7270050048828 	 kl mean: 10.088837623596191 	 loss mean: 139.81585693359375



                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.89it/s][A
 40%|████      | 4/10 [00:00<00:00, 15.01it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.12it/s]

nll mean: 130.17633056640625 	 kl mean: 10.088837623596191 	 loss mean: 140.26516723632812
nll mean: 129.86102294921875 	 kl mean: 10.088837623596191 	 loss mean: 139.94985961914062
nll mean: 130.30859375 	 kl mean: 10.088837623596191 	 loss mean: 140.39743041992188
nll mean: 129.9330596923828 	 kl mean: 10.088837623596191 	 loss mean: 140.02188110351562


[A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.59it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A

nll mean: 129.71319580078125 	 kl mean: 10.088837623596191 	 loss mean: 139.8020477294922
nll mean: 130.02008056640625 	 kl mean: 10.088837623596191 	 loss mean: 140.10891723632812
nll mean: 130.0428466796875 	 kl mean: 10.088837623596191 	 loss mean: 140.13168334960938



                                              
 21%|██        | 8/38 [00:05<00:15,  1.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.58it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.66it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A

nll mean: 129.77059936523438 	 kl mean: 10.088837623596191 	 loss mean: 139.85943603515625
nll mean: 130.09906005859375 	 kl mean: 9.799177169799805 	 loss mean: 139.8982391357422
nll mean: 130.54122924804688 	 kl mean: 9.799177169799805 	 loss mean: 140.34042358398438
nll mean: 129.86444091796875 	 kl mean: 9.799177169799805 	 loss mean: 139.66360473632812
nll mean: 130.3935546875 	 kl mean: 9.799177169799805 	 loss mean: 140.19273376464844



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.40it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.30it/s][A

nll mean: 131.14938354492188 	 kl mean: 9.799177169799805 	 loss mean: 140.9485626220703
nll mean: 130.47145080566406 	 kl mean: 9.799177169799805 	 loss mean: 140.2706298828125
nll mean: 130.0972137451172 	 kl mean: 9.799177169799805 	 loss mean: 139.89639282226562
nll mean: 130.64495849609375 	 kl mean: 9.799177169799805 	 loss mean: 140.44415283203125
nll mean: 129.6143798828125 	 kl mean: 9.799177169799805 	 loss mean: 139.41355895996094



                                              
100%|██████████| 10/10 [00:00<00:00, 21.10it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 25.00it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A

nll mean: 130.05189514160156 	 kl mean: 9.799177169799805 	 loss mean: 139.85107421875
nll mean: 117.50326538085938 	 kl mean: 9.666709899902344 	 loss mean: 127.16997528076172
nll mean: 117.11053466796875 	 kl mean: 9.666709899902344 	 loss mean: 126.77725219726562
nll mean: 117.4044189453125 	 kl mean: 9.666709899902344 	 loss mean: 127.07113647460938
nll mean: 117.04682922363281 	 kl mean: 9.666709899902344 	 loss mean: 126.71353149414062



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.87it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.74it/s][A

nll mean: 117.68914794921875 	 kl mean: 9.666709899902344 	 loss mean: 127.3558578491211
nll mean: 117.72596740722656 	 kl mean: 9.666709899902344 	 loss mean: 127.3926773071289
nll mean: 117.31732177734375 	 kl mean: 9.666709899902344 	 loss mean: 126.9840316772461
nll mean: 117.68499755859375 	 kl mean: 9.666709899902344 	 loss mean: 127.35171508789062
nll mean: 117.36238861083984 	 kl mean: 9.666709899902344 	 loss mean: 127.02909851074219



                                               
100%|██████████| 10/10 [00:00<00:00, 24.61it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A

nll mean: 117.3550033569336 	 kl mean: 9.666709899902344 	 loss mean: 127.02171325683594
nll mean: 140.25706481933594 	 kl mean: 9.844732284545898 	 loss mean: 150.10179138183594
nll mean: 140.645263671875 	 kl mean: 9.844732284545898 	 loss mean: 150.489990234375
nll mean: 140.57318115234375 	 kl mean: 9.844732284545898 	 loss mean: 150.41790771484375
nll mean: 140.78329467773438 	 kl mean: 9.844732284545898 	 loss mean: 150.62802124023438



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.32it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.23it/s][A

nll mean: 140.26177978515625 	 kl mean: 9.844732284545898 	 loss mean: 150.1065216064453
nll mean: 140.30328369140625 	 kl mean: 9.844732284545898 	 loss mean: 150.14801025390625
nll mean: 140.1558074951172 	 kl mean: 9.844732284545898 	 loss mean: 150.0005340576172
nll mean: 140.49014282226562 	 kl mean: 9.844732284545898 	 loss mean: 150.33486938476562
nll mean: 140.52987670898438 	 kl mean: 9.844732284545898 	 loss mean: 150.37460327148438



                                               
100%|██████████| 10/10 [00:00<00:00, 21.04it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A

nll mean: 140.87120056152344 	 kl mean: 9.844732284545898 	 loss mean: 150.7159423828125
nll mean: 119.31819915771484 	 kl mean: 9.845075607299805 	 loss mean: 129.16326904296875
nll mean: 119.43960571289062 	 kl mean: 9.845075607299805 	 loss mean: 129.28468322753906


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 20%|██        | 2/10 [00:00<00:00, 12.75it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A

nll mean: 118.98636627197266 	 kl mean: 9.845075607299805 	 loss mean: 128.83145141601562
nll mean: 119.22193908691406 	 kl mean: 9.845075607299805 	 loss mean: 129.0670166015625
nll mean: 119.32689666748047 	 kl mean: 9.845075607299805 	 loss mean: 129.17196655273438


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 40%|████      | 4/10 [00:00<00:00, 12.66it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.60it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A

nll mean: 119.48159790039062 	 kl mean: 9.845075607299805 	 loss mean: 129.32666015625
nll mean: 118.73084259033203 	 kl mean: 9.845075607299805 	 loss mean: 128.575927734375
nll mean: 119.55056762695312 	 kl mean: 9.845075607299805 	 loss mean: 129.39564514160156


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 10%|█         | 1/10 [00:00<00:00,  9.90it/s][A

nll mean: 119.18436431884766 	 kl mean: 9.845075607299805 	 loss mean: 129.02943420410156
nll mean: 119.27314758300781 	 kl mean: 9.845075607299805 	 loss mean: 129.11822509765625
nll mean: 160.1762237548828 	 kl mean: 10.971343040466309 	 loss mean: 171.14755249023438



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.84it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.81it/s][A

nll mean: 160.75668334960938 	 kl mean: 10.971343040466309 	 loss mean: 171.72802734375
nll mean: 160.0225830078125 	 kl mean: 10.971343040466309 	 loss mean: 170.99392700195312



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.86it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.87it/s][A
                                              

nll mean: 159.91082763671875 	 kl mean: 10.971343040466309 	 loss mean: 170.88217163085938
nll mean: 160.35934448242188 	 kl mean: 10.971343040466309 	 loss mean: 171.3306884765625


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.89it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.89it/s][A
                                              

nll mean: 160.75704956054688 	 kl mean: 10.971343040466309 	 loss mean: 171.7283935546875
nll mean: 160.12608337402344 	 kl mean: 10.971343040466309 	 loss mean: 171.097412109375


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.94it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A

nll mean: 159.9074249267578 	 kl mean: 10.971343040466309 	 loss mean: 170.87876892089844
nll mean: 159.55923461914062 	 kl mean: 10.971343040466309 	 loss mean: 170.5305633544922
nll mean: 160.1227569580078 	 kl mean: 10.971343040466309 	 loss mean: 171.09408569335938



100%|██████████| 10/10 [00:01<00:00,  9.91it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.28it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.08it/s][A

nll mean: 133.24102783203125 	 kl mean: 9.504106521606445 	 loss mean: 142.74513244628906
nll mean: 133.47006225585938 	 kl mean: 9.504106521606445 	 loss mean: 142.97418212890625
nll mean: 132.75148010253906 	 kl mean: 9.504106521606445 	 loss mean: 142.25558471679688
nll mean: 133.41017150878906 	 kl mean: 9.504106521606445 	 loss mean: 142.91427612304688



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.09it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.05it/s][A

nll mean: 133.10462951660156 	 kl mean: 9.504106521606445 	 loss mean: 142.60873413085938
nll mean: 133.40130615234375 	 kl mean: 9.504106521606445 	 loss mean: 142.90542602539062
nll mean: 133.39297485351562 	 kl mean: 9.504106521606445 	 loss mean: 142.89707946777344
nll mean: 132.9939727783203 	 kl mean: 9.504106521606445 	 loss mean: 142.49807739257812



                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.93it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]

nll mean: 133.58248901367188 	 kl mean: 9.504106521606445 	 loss mean: 143.08660888671875
nll mean: 133.80722045898438 	 kl mean: 9.504106521606445 	 loss mean: 143.31134033203125
nll mean: 141.44097900390625 	 kl mean: 10.027235984802246 	 loss mean: 151.4682159423828



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.82it/s][A

nll mean: 142.0129852294922 	 kl mean: 10.027235984802246 	 loss mean: 152.04022216796875
nll mean: 142.9373016357422 	 kl mean: 10.027235984802246 	 loss mean: 152.96453857421875
nll mean: 141.7235107421875 	 kl mean: 10.027235984802246 	 loss mean: 151.75074768066406



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.81it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A

nll mean: 142.12158203125 	 kl mean: 10.027235984802246 	 loss mean: 152.14881896972656
nll mean: 141.90219116210938 	 kl mean: 10.027235984802246 	 loss mean: 151.929443359375
nll mean: 141.82684326171875 	 kl mean: 10.027235984802246 	 loss mean: 151.85409545898438



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.73it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 141.8656005859375 	 kl mean: 10.027235984802246 	 loss mean: 151.89285278320312
nll mean: 142.32894897460938 	 kl mean: 10.027235984802246 	 loss mean: 152.356201171875
nll mean: 142.02239990234375 	 kl mean: 10.027235984802246 	 loss mean: 152.04965209960938


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.58it/s][A

nll mean: 141.67239379882812 	 kl mean: 9.418211936950684 	 loss mean: 151.09060668945312
nll mean: 141.46995544433594 	 kl mean: 9.418211936950684 	 loss mean: 150.88815307617188
nll mean: 141.3652801513672 	 kl mean: 9.418211936950684 	 loss mean: 150.7834930419922
nll mean: 141.8080596923828 	 kl mean: 9.418211936950684 	 loss mean: 151.2262725830078
nll mean: 141.97113037109375 	 kl mean: 9.418211936950684 	 loss mean: 151.38934326171875


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.58it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.56it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
100%|██████████| 10/10 [00:00<00:00, 24.67it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 142.59146118164062 	 kl mean: 9.418211936950684 	 loss mean: 152.00967407226562
nll mean: 141.6379852294922 	 kl mean: 9.418211936950684 	 loss mean: 151.05621337890625
nll mean: 141.5936279296875 	 kl mean: 9.418211936950684 	 loss mean: 151.0118408203125
nll mean: 141.62806701660156 	 kl mean: 9.418211936950684 	 loss mean: 151.04629516601562
nll mean: 142.1893310546875 	 kl mean: 9.418211936950684 	 loss mean: 151.6075439453125



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 25.19it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 25.19it/s][A

nll mean: 133.66554260253906 	 kl mean: 10.082940101623535 	 loss mean: 143.74847412109375
nll mean: 133.22286987304688 	 kl mean: 10.082940101623535 	 loss mean: 143.30581665039062
nll mean: 133.3141326904297 	 kl mean: 10.082940101623535 	 loss mean: 143.39707946777344
nll mean: 133.3690185546875 	 kl mean: 10.082940101623535 	 loss mean: 143.45196533203125
nll mean: 133.324462890625 	 kl mean: 10.082940101623535 	 loss mean: 143.4073944091797
nll mean: 133.08563232421875 	 kl mean: 10.082940101623535 	 loss mean: 143.16856384277344


 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.13it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.03it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.93it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.49932861328125 	 kl mean: 10.082940101623535 	 loss mean: 143.582275390625
nll mean: 133.0819091796875 	 kl mean: 10.082940101623535 	 loss mean: 143.16485595703125
nll mean: 133.52606201171875 	 kl mean: 10.082940101623535 	 loss mean: 143.6090087890625
nll mean: 133.60000610351562 	 kl mean: 10.082940101623535 	 loss mean: 143.68295288085938



                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 20%|██        | 2/10 [00:00<00:00, 12.53it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A

nll mean: 126.13919830322266 	 kl mean: 11.162394523620605 	 loss mean: 137.3015899658203
nll mean: 126.24687194824219 	 kl mean: 11.162394523620605 	 loss mean: 137.4092559814453
nll mean: 125.92256164550781 	 kl mean: 11.162394523620605 	 loss mean: 137.08494567871094



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.48it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.42it/s][A

nll mean: 126.32371520996094 	 kl mean: 11.162394523620605 	 loss mean: 137.48611450195312
nll mean: 126.0499038696289 	 kl mean: 11.162394523620605 	 loss mean: 137.2122802734375
nll mean: 125.66650390625 	 kl mean: 11.162394523620605 	 loss mean: 136.82888793945312



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A

nll mean: 126.2404556274414 	 kl mean: 11.162394523620605 	 loss mean: 137.40284729003906
nll mean: 126.77674865722656 	 kl mean: 11.162394523620605 	 loss mean: 137.9391326904297
nll mean: 126.28849029541016 	 kl mean: 11.162394523620605 	 loss mean: 137.45086669921875



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.38it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.49it/s][A

nll mean: 125.60810852050781 	 kl mean: 11.162394523620605 	 loss mean: 136.7705078125
nll mean: 146.28173828125 	 kl mean: 10.211620330810547 	 loss mean: 156.4933624267578
nll mean: 146.32400512695312 	 kl mean: 10.211620330810547 	 loss mean: 156.53562927246094



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A

nll mean: 146.01806640625 	 kl mean: 10.211620330810547 	 loss mean: 156.2296905517578
nll mean: 146.03277587890625 	 kl mean: 10.211620330810547 	 loss mean: 156.24440002441406
nll mean: 146.3280029296875 	 kl mean: 10.211620330810547 	 loss mean: 156.5396270751953



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.57it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.66it/s][A

nll mean: 146.7247314453125 	 kl mean: 10.211620330810547 	 loss mean: 156.93634033203125
nll mean: 146.22067260742188 	 kl mean: 10.211620330810547 	 loss mean: 156.43231201171875
nll mean: 146.0948944091797 	 kl mean: 10.211620330810547 	 loss mean: 156.3065185546875



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.68it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 145.7213134765625 	 kl mean: 10.211620330810547 	 loss mean: 155.93292236328125
nll mean: 145.6098175048828 	 kl mean: 10.211620330810547 	 loss mean: 155.82144165039062
nll mean: 154.3750762939453 	 kl mean: 9.747068405151367 	 loss mean: 164.12213134765625


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.58it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A

nll mean: 153.837646484375 	 kl mean: 9.747068405151367 	 loss mean: 163.584716796875
nll mean: 154.12701416015625 	 kl mean: 9.747068405151367 	 loss mean: 163.8740997314453
nll mean: 154.43910217285156 	 kl mean: 9.747068405151367 	 loss mean: 164.1861572265625


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A

nll mean: 154.59889221191406 	 kl mean: 9.747068405151367 	 loss mean: 164.34596252441406
nll mean: 153.92987060546875 	 kl mean: 9.747068405151367 	 loss mean: 163.67694091796875
nll mean: 154.21170043945312 	 kl mean: 9.747068405151367 	 loss mean: 163.95877075195312


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.69it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.70it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 153.75018310546875 	 kl mean: 9.747068405151367 	 loss mean: 163.4972686767578
nll mean: 153.93798828125 	 kl mean: 9.747068405151367 	 loss mean: 163.68505859375
nll mean: 154.21673583984375 	 kl mean: 9.747068405151367 	 loss mean: 163.96380615234375



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.47it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.31it/s][A

nll mean: 116.03817749023438 	 kl mean: 9.755216598510742 	 loss mean: 125.79338073730469
nll mean: 116.01422119140625 	 kl mean: 9.755216598510742 	 loss mean: 125.76943969726562
nll mean: 115.73613739013672 	 kl mean: 9.755216598510742 	 loss mean: 125.4913558959961



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.29it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s][A

nll mean: 115.84687805175781 	 kl mean: 9.755216598510742 	 loss mean: 125.60209655761719
nll mean: 115.76583862304688 	 kl mean: 9.755216598510742 	 loss mean: 125.52105712890625
nll mean: 116.32498931884766 	 kl mean: 9.755216598510742 	 loss mean: 126.0802001953125



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.29it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.15it/s][A
                                               


nll mean: 115.93125915527344 	 kl mean: 9.755216598510742 	 loss mean: 125.68646240234375
nll mean: 115.67716979980469 	 kl mean: 9.755216598510742 	 loss mean: 125.4323959350586
nll mean: 116.17898559570312 	 kl mean: 9.755216598510742 	 loss mean: 125.9342041015625


 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.17it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 32.17it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A

nll mean: 115.8739013671875 	 kl mean: 9.755216598510742 	 loss mean: 125.62911987304688
nll mean: 104.63705444335938 	 kl mean: 9.18754768371582 	 loss mean: 113.8246078491211
nll mean: 104.9163589477539 	 kl mean: 9.18754768371582 	 loss mean: 114.10391235351562
nll mean: 104.689697265625 	 kl mean: 9.18754768371582 	 loss mean: 113.87724304199219
nll mean: 104.65264892578125 	 kl mean: 9.18754768371582 	 loss mean: 113.84019470214844
nll mean: 104.68046569824219 	 kl mean: 9.18754768371582 	 loss mean: 113.86801147460938
nll mean: 104.7457046508789 	 kl mean: 9.18754768371582 	 loss mean: 113.9332504272461



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
 80%|████████  | 8/10 [00:00<00:00, 31.86it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 31.13it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]

nll mean: 104.73090362548828 	 kl mean: 9.18754768371582 	 loss mean: 113.91844940185547
nll mean: 104.85476684570312 	 kl mean: 9.18754768371582 	 loss mean: 114.04231262207031
nll mean: 105.28124237060547 	 kl mean: 9.18754768371582 	 loss mean: 114.46879577636719
nll mean: 104.73252868652344 	 kl mean: 9.18754768371582 	 loss mean: 113.92007446289062
nll mean: 157.38206481933594 	 kl mean: 10.103671073913574 	 loss mean: 167.48573303222656



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.57it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A

nll mean: 157.3966064453125 	 kl mean: 10.103671073913574 	 loss mean: 167.5002899169922
nll mean: 157.66091918945312 	 kl mean: 10.103671073913574 	 loss mean: 167.76458740234375
nll mean: 156.9484405517578 	 kl mean: 10.103671073913574 	 loss mean: 167.0521240234375



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A

nll mean: 156.78094482421875 	 kl mean: 10.103671073913574 	 loss mean: 166.88462829589844
nll mean: 157.033935546875 	 kl mean: 10.103671073913574 	 loss mean: 167.13760375976562
nll mean: 157.1053009033203 	 kl mean: 10.103671073913574 	 loss mean: 167.20896911621094



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.65it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]

nll mean: 157.29214477539062 	 kl mean: 10.103671073913574 	 loss mean: 167.39581298828125
nll mean: 156.7451171875 	 kl mean: 10.103671073913574 	 loss mean: 166.84877014160156
nll mean: 157.15399169921875 	 kl mean: 10.103671073913574 	 loss mean: 167.25765991210938
nll mean: 118.62226867675781 	 kl mean: 10.944461822509766 	 loss mean: 129.56674194335938



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.88it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.68it/s][A

nll mean: 119.20987701416016 	 kl mean: 10.944461822509766 	 loss mean: 130.15432739257812
nll mean: 119.01826477050781 	 kl mean: 10.944461822509766 	 loss mean: 129.9627227783203
nll mean: 118.50759887695312 	 kl mean: 10.944461822509766 	 loss mean: 129.45205688476562
nll mean: 118.74658203125 	 kl mean: 10.944461822509766 	 loss mean: 129.6910400390625
nll mean: 118.52076721191406 	 kl mean: 10.944461822509766 	 loss mean: 129.46522521972656



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.44it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.41it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.99606323242188 	 kl mean: 10.944461822509766 	 loss mean: 129.94053649902344
nll mean: 118.73152160644531 	 kl mean: 10.944461822509766 	 loss mean: 129.6759796142578
nll mean: 119.02487182617188 	 kl mean: 10.944461822509766 	 loss mean: 129.96932983398438
nll mean: 118.57591247558594 	 kl mean: 10.944461822509766 	 loss mean: 129.52037048339844



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.57it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A

nll mean: 113.63658142089844 	 kl mean: 9.549755096435547 	 loss mean: 123.18633270263672
nll mean: 113.5959701538086 	 kl mean: 9.549755096435547 	 loss mean: 123.14572143554688
nll mean: 113.19722747802734 	 kl mean: 9.549755096435547 	 loss mean: 122.74697875976562



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.62it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.76it/s][A

nll mean: 112.87299346923828 	 kl mean: 9.549755096435547 	 loss mean: 122.42273712158203
nll mean: 113.50936889648438 	 kl mean: 9.549755096435547 	 loss mean: 123.05912780761719
nll mean: 113.70309448242188 	 kl mean: 9.549755096435547 	 loss mean: 123.25285339355469



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.68it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A

nll mean: 113.55791473388672 	 kl mean: 9.549755096435547 	 loss mean: 123.107666015625
nll mean: 113.79440307617188 	 kl mean: 9.549755096435547 	 loss mean: 123.34415435791016
nll mean: 114.019287109375 	 kl mean: 9.549755096435547 	 loss mean: 123.56904602050781



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.69it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 22.03it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 113.26849365234375 	 kl mean: 9.549755096435547 	 loss mean: 122.81825256347656
nll mean: 81.96749877929688 	 kl mean: 8.699159622192383 	 loss mean: 90.66665649414062
nll mean: 81.66858673095703 	 kl mean: 8.699159622192383 	 loss mean: 90.36774444580078
nll mean: 81.57560729980469 	 kl mean: 8.699159622192383 	 loss mean: 90.27476501464844
nll mean: 81.63269805908203 	 kl mean: 8.699159622192383 	 loss mean: 90.33186340332031



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.23it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.24it/s][A

nll mean: 81.59686279296875 	 kl mean: 8.699159622192383 	 loss mean: 90.2960205078125
nll mean: 81.46900939941406 	 kl mean: 8.699159622192383 	 loss mean: 90.16816711425781
nll mean: 81.41187286376953 	 kl mean: 8.699159622192383 	 loss mean: 90.11103057861328
nll mean: 81.16120147705078 	 kl mean: 8.699159622192383 	 loss mean: 89.86036682128906
nll mean: 81.33043670654297 	 kl mean: 8.699159622192383 	 loss mean: 90.02959442138672



                                               
100%|██████████| 10/10 [00:00<00:00, 22.15it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 20.89it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A

nll mean: 81.85015869140625 	 kl mean: 8.699159622192383 	 loss mean: 90.54931640625
nll mean: 107.96294403076172 	 kl mean: 9.09119987487793 	 loss mean: 117.05413818359375
nll mean: 107.98954772949219 	 kl mean: 9.09119987487793 	 loss mean: 117.08074951171875
nll mean: 107.92171478271484 	 kl mean: 9.09119987487793 	 loss mean: 117.01292419433594
nll mean: 108.43512725830078 	 kl mean: 9.09119987487793 	 loss mean: 117.52632141113281



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 20.85it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 20.81it/s][A

nll mean: 108.31436157226562 	 kl mean: 9.09119987487793 	 loss mean: 117.40556335449219
nll mean: 108.63583374023438 	 kl mean: 9.09119987487793 	 loss mean: 117.7270278930664
nll mean: 108.3893051147461 	 kl mean: 9.09119987487793 	 loss mean: 117.48049926757812
nll mean: 108.40585327148438 	 kl mean: 9.09119987487793 	 loss mean: 117.4970474243164
nll mean: 108.1436767578125 	 kl mean: 9.09119987487793 	 loss mean: 117.23487854003906



                                               
100%|██████████| 10/10 [00:00<00:00, 20.95it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 20%|██        | 2/10 [00:00<00:00, 12.16it/s][A

nll mean: 108.40534973144531 	 kl mean: 9.09119987487793 	 loss mean: 117.49654388427734
nll mean: 119.96038818359375 	 kl mean: 10.13045883178711 	 loss mean: 130.09085083007812
nll mean: 119.37077331542969 	 kl mean: 10.13045883178711 	 loss mean: 129.501220703125



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.19it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A

nll mean: 119.45339965820312 	 kl mean: 10.13045883178711 	 loss mean: 129.5838623046875
nll mean: 119.5948486328125 	 kl mean: 10.13045883178711 	 loss mean: 129.72531127929688
nll mean: 119.33061218261719 	 kl mean: 10.13045883178711 	 loss mean: 129.46109008789062



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.30it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.27it/s][A

nll mean: 119.35433197021484 	 kl mean: 10.13045883178711 	 loss mean: 129.4847869873047
nll mean: 119.90862274169922 	 kl mean: 10.13045883178711 	 loss mean: 130.03907775878906
nll mean: 119.46549987792969 	 kl mean: 10.13045883178711 	 loss mean: 129.595947265625



                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.27it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]

nll mean: 119.36734771728516 	 kl mean: 10.13045883178711 	 loss mean: 129.497802734375
nll mean: 119.76002502441406 	 kl mean: 10.13045883178711 	 loss mean: 129.89048767089844
nll mean: 60.96165466308594 	 kl mean: 10.565200805664062 	 loss mean: 71.52685546875



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 10.16it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.07it/s][A
                                               

nll mean: 60.59982681274414 	 kl mean: 10.565200805664062 	 loss mean: 71.16502380371094
nll mean: 60.599281311035156 	 kl mean: 10.565200805664062 	 loss mean: 71.16448211669922



 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.09it/s][A
[A                                           

nll mean: 60.904701232910156 	 kl mean: 10.565200805664062 	 loss mean: 71.46990203857422
nll mean: 60.63750457763672 	 kl mean: 10.565200805664062 	 loss mean: 71.20270538330078


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.97it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.98it/s][A
                                               


nll mean: 60.99009323120117 	 kl mean: 10.565200805664062 	 loss mean: 71.5552978515625
nll mean: 61.023406982421875 	 kl mean: 10.565200805664062 	 loss mean: 71.58860778808594
nll mean: 60.06368637084961 	 kl mean: 10.565200805664062 	 loss mean: 70.62889099121094


 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.96it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.95it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.59it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.97it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 60.6322135925293 	 kl mean: 10.565200805664062 	 loss mean: 71.19741821289062
nll mean: 60.70261001586914 	 kl mean: 10.565200805664062 	 loss mean: 71.26780700683594
nll mean: 102.50007629394531 	 kl mean: 9.705951690673828 	 loss mean: 112.2060317993164


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 12.91it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.87it/s][A

nll mean: 102.48577880859375 	 kl mean: 9.705951690673828 	 loss mean: 112.19172668457031
nll mean: 102.95306396484375 	 kl mean: 9.705951690673828 	 loss mean: 112.65901184082031
nll mean: 102.06216430664062 	 kl mean: 9.705951690673828 	 loss mean: 111.76811218261719


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.87it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.82it/s][A

nll mean: 102.70014190673828 	 kl mean: 9.705951690673828 	 loss mean: 112.40608978271484
nll mean: 102.341064453125 	 kl mean: 9.705951690673828 	 loss mean: 112.04701232910156
nll mean: 102.54002380371094 	 kl mean: 9.705951690673828 	 loss mean: 112.24598693847656


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.82it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.60it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 101.94866943359375 	 kl mean: 9.705951690673828 	 loss mean: 111.65463256835938
nll mean: 102.22724914550781 	 kl mean: 9.705951690673828 	 loss mean: 111.93321228027344
nll mean: 102.17908477783203 	 kl mean: 9.705951690673828 	 loss mean: 111.88504028320312


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.98it/s][A

nll mean: 135.3502197265625 	 kl mean: 10.734386444091797 	 loss mean: 146.08460998535156
nll mean: 135.25186157226562 	 kl mean: 10.734386444091797 	 loss mean: 145.98623657226562


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00,  9.98it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00,  9.92it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A

nll mean: 135.12059020996094 	 kl mean: 10.734386444091797 	 loss mean: 145.85498046875
nll mean: 135.34185791015625 	 kl mean: 10.734386444091797 	 loss mean: 146.07623291015625


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.91it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.83it/s][A

nll mean: 134.85047912597656 	 kl mean: 10.734386444091797 	 loss mean: 145.58486938476562
nll mean: 135.43679809570312 	 kl mean: 10.734386444091797 	 loss mean: 146.17117309570312


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.83it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.81it/s][A
                                               [A
                                              

nll mean: 135.29151916503906 	 kl mean: 10.734386444091797 	 loss mean: 146.02590942382812
nll mean: 135.36097717285156 	 kl mean: 10.734386444091797 	 loss mean: 146.09535217285156


 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.85it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.87it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.85it/s][A
 84%|████████▍ | 32/38 [00:20<00:05,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]

nll mean: 135.5142822265625 	 kl mean: 10.734386444091797 	 loss mean: 146.24867248535156
nll mean: 135.28138732910156 	 kl mean: 10.734386444091797 	 loss mean: 146.01577758789062
nll mean: 63.637752532958984 	 kl mean: 8.33749008178711 	 loss mean: 71.9752426147461
nll mean: 63.46021270751953 	 kl mean: 8.33749008178711 	 loss mean: 71.7977066040039



                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
 30%|███       | 3/10 [00:00<00:00, 26.03it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.87it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A

nll mean: 63.13959503173828 	 kl mean: 8.33749008178711 	 loss mean: 71.47708892822266
nll mean: 63.324256896972656 	 kl mean: 8.33749008178711 	 loss mean: 71.6617431640625
nll mean: 63.76078414916992 	 kl mean: 8.33749008178711 	 loss mean: 72.09827423095703
nll mean: 63.67622756958008 	 kl mean: 8.33749008178711 	 loss mean: 72.01371765136719
nll mean: 63.66419219970703 	 kl mean: 8.33749008178711 	 loss mean: 72.0016860961914
nll mean: 63.475379943847656 	 kl mean: 8.33749008178711 	 loss mean: 71.8128662109375



                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.82it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.69it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 30%|███       | 3/10 [00:00<00:00, 21.47it/s][A

nll mean: 64.10098266601562 	 kl mean: 8.33749008178711 	 loss mean: 72.43846130371094
nll mean: 63.654056549072266 	 kl mean: 8.33749008178711 	 loss mean: 71.99154663085938
nll mean: 118.58056640625 	 kl mean: 9.046307563781738 	 loss mean: 127.62687683105469
nll mean: 118.60386657714844 	 kl mean: 9.046307563781738 	 loss mean: 127.65017700195312
nll mean: 118.44464111328125 	 kl mean: 9.046307563781738 	 loss mean: 127.49095153808594



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.53it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A

nll mean: 118.63880920410156 	 kl mean: 9.046307563781738 	 loss mean: 127.68512725830078
nll mean: 118.35426330566406 	 kl mean: 9.046307563781738 	 loss mean: 127.40057373046875
nll mean: 118.33818054199219 	 kl mean: 9.046307563781738 	 loss mean: 127.38448333740234
nll mean: 118.58594512939453 	 kl mean: 9.046307563781738 	 loss mean: 127.63224792480469
nll mean: 118.74822998046875 	 kl mean: 9.046307563781738 	 loss mean: 127.79454803466797



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.58it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.60it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]

nll mean: 118.19415283203125 	 kl mean: 9.046307563781738 	 loss mean: 127.24046325683594
nll mean: 118.89567565917969 	 kl mean: 9.046307563781738 	 loss mean: 127.94197845458984
nll mean: 117.7188720703125 	 kl mean: 9.742961883544922 	 loss mean: 127.46183776855469



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.15it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.21it/s][A

nll mean: 118.36319732666016 	 kl mean: 9.742961883544922 	 loss mean: 128.10617065429688
nll mean: 118.27328491210938 	 kl mean: 9.742961883544922 	 loss mean: 128.01625061035156
nll mean: 118.36949157714844 	 kl mean: 9.742961883544922 	 loss mean: 128.11245727539062



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.24it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A

nll mean: 118.11398315429688 	 kl mean: 9.742961883544922 	 loss mean: 127.85693359375
nll mean: 118.47084045410156 	 kl mean: 9.742961883544922 	 loss mean: 128.2137908935547
nll mean: 118.18577575683594 	 kl mean: 9.742961883544922 	 loss mean: 127.92872619628906



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.31it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.57142639160156 	 kl mean: 9.742961883544922 	 loss mean: 128.31439208984375
nll mean: 118.2249755859375 	 kl mean: 9.742961883544922 	 loss mean: 127.96794128417969
nll mean: 118.04234313964844 	 kl mean: 9.742961883544922 	 loss mean: 127.78530883789062



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.60it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s][A

nll mean: 112.88408660888672 	 kl mean: 9.328304290771484 	 loss mean: 122.21238708496094
nll mean: 112.14328002929688 	 kl mean: 9.328304290771484 	 loss mean: 121.47158813476562
nll mean: 112.5155029296875 	 kl mean: 9.328304290771484 	 loss mean: 121.84381103515625



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.58it/s][A

nll mean: 112.83123016357422 	 kl mean: 9.328304290771484 	 loss mean: 122.15953063964844
nll mean: 112.51438903808594 	 kl mean: 9.328304290771484 	 loss mean: 121.84268951416016
nll mean: 112.56144714355469 	 kl mean: 9.328304290771484 	 loss mean: 121.88975524902344



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.64it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A

nll mean: 112.39369201660156 	 kl mean: 9.328304290771484 	 loss mean: 121.72199249267578
nll mean: 113.14906311035156 	 kl mean: 9.328304290771484 	 loss mean: 122.47737121582031
nll mean: 112.77505493164062 	 kl mean: 9.328304290771484 	 loss mean: 122.10336303710938



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.71it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A

nll mean: 112.38516235351562 	 kl mean: 9.328304290771484 	 loss mean: 121.71347045898438
nll mean: 110.28667449951172 	 kl mean: 9.691522598266602 	 loss mean: 119.97819519042969
nll mean: 110.11325073242188 	 kl mean: 9.691522598266602 	 loss mean: 119.80477142333984
nll mean: 110.64639282226562 	 kl mean: 9.691522598266602 	 loss mean: 120.33792114257812
nll mean: 109.7309799194336 	 kl mean: 9.691522598266602 	 loss mean: 119.42250061035156



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 50%|█████     | 5/10 [00:00<00:00, 21.82it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 80%|████████  | 8/10 [00:00<00:00, 21.58it/s][A
                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A

nll mean: 110.27668762207031 	 kl mean: 9.691522598266602 	 loss mean: 119.96821594238281
nll mean: 109.87527465820312 	 kl mean: 9.691522598266602 	 loss mean: 119.5667953491211
nll mean: 110.40324401855469 	 kl mean: 9.691522598266602 	 loss mean: 120.09476470947266
nll mean: 109.81342315673828 	 kl mean: 9.691522598266602 	 loss mean: 119.50494384765625
nll mean: 109.81180572509766 	 kl mean: 9.691522598266602 	 loss mean: 119.50332641601562



                                               
100%|██████████| 10/10 [00:00<00:00, 21.18it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.47it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
[A                                           

nll mean: 110.29978942871094 	 kl mean: 9.691522598266602 	 loss mean: 119.99130249023438
nll mean: 85.45195770263672 	 kl mean: 10.08852767944336 	 loss mean: 95.54048919677734
nll mean: 85.78335571289062 	 kl mean: 10.08852767944336 	 loss mean: 95.87188720703125
nll mean: 84.8653793334961 	 kl mean: 10.08852767944336 	 loss mean: 94.95390319824219
nll mean: 84.63709259033203 	 kl mean: 10.08852767944336 	 loss mean: 94.72561645507812
nll mean: 85.0445785522461 	 kl mean: 10.08852767944336 	 loss mean: 95.13311004638672


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.41it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.35it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 85.49836730957031 	 kl mean: 10.08852767944336 	 loss mean: 95.58689880371094
nll mean: 85.36749267578125 	 kl mean: 10.08852767944336 	 loss mean: 95.45601654052734
nll mean: 85.12367248535156 	 kl mean: 10.08852767944336 	 loss mean: 95.21220397949219
nll mean: 85.46353149414062 	 kl mean: 10.08852767944336 	 loss mean: 95.55206298828125
nll mean: 85.22999572753906 	 kl mean: 10.08852767944336 	 loss mean: 95.31852722167969
Approximate NLL:
tensor(120.0548, device='cuda:0')
Approximate KL:
tensor(9.7923, device='cuda:0')
Testing took 0:00:25.453109


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .61it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .61it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .61it/s][A
                                              

nll mean: 107.97981262207031 	 kl mean: 10.369463920593262 	 loss mean: 118.34927368164062
nll mean: 107.73157501220703 	 kl mean: 10.369463920593262 	 loss mean: 118.10103607177734
nll mean: 107.51216125488281 	 kl mean: 10.369463920593262 	 loss mean: 117.88162231445312
nll mean: 107.37135314941406 	 kl mean: 10.369463920593262 	 loss mean: 117.74081420898438
nll mean: 108.29737091064453 	 kl mean: 10.369463920593262 	 loss mean: 118.66683197021484


  0%|          | 0/38 [00:00<?, ?it/s]
 30%|███       | 3/10 [00:00<00:00, 25.61it/s][A
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.40it/s][A
                                      .29it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.15it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 107.88233947753906 	 kl mean: 10.369463920593262 	 loss mean: 118.25180053710938
nll mean: 107.27119445800781 	 kl mean: 10.369463920593262 	 loss mean: 117.64065551757812
nll mean: 107.72810363769531 	 kl mean: 10.369463920593262 	 loss mean: 118.09756469726562
nll mean: 108.09144592285156 	 kl mean: 10.369463920593262 	 loss mean: 118.46089935302734
nll mean: 107.5330810546875 	 kl mean: 10.369463920593262 	 loss mean: 117.90254974365234


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.98it/s][A

nll mean: 124.56088256835938 	 kl mean: 9.95506477355957 	 loss mean: 134.51596069335938
nll mean: 125.11537170410156 	 kl mean: 9.95506477355957 	 loss mean: 135.0704345703125
nll mean: 125.0589599609375 	 kl mean: 9.95506477355957 	 loss mean: 135.01400756835938


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.98it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 40%|████      | 4/10 [00:00<00:00, 14.16it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.14it/s][A

nll mean: 124.40682983398438 	 kl mean: 9.95506477355957 	 loss mean: 134.36187744140625
nll mean: 125.17990112304688 	 kl mean: 9.95506477355957 	 loss mean: 135.13494873046875
nll mean: 124.84205627441406 	 kl mean: 9.95506477355957 	 loss mean: 134.797119140625


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.14it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.04it/s][A

nll mean: 125.19841003417969 	 kl mean: 9.95506477355957 	 loss mean: 135.15347290039062
nll mean: 124.89216613769531 	 kl mean: 9.95506477355957 	 loss mean: 134.84722900390625
nll mean: 125.14520263671875 	 kl mean: 9.95506477355957 	 loss mean: 135.10028076171875


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.04it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.10it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 24.82it/s][A

nll mean: 124.520751953125 	 kl mean: 9.95506477355957 	 loss mean: 134.475830078125
nll mean: 97.82432556152344 	 kl mean: 9.094049453735352 	 loss mean: 106.91838073730469
nll mean: 98.07440185546875 	 kl mean: 9.094049453735352 	 loss mean: 107.16844940185547
nll mean: 98.00363159179688 	 kl mean: 9.094049453735352 	 loss mean: 107.09768676757812
nll mean: 98.2534408569336 	 kl mean: 9.094049453735352 	 loss mean: 107.34748840332031


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 24.82it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.55it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.49it/s][A

nll mean: 97.52603149414062 	 kl mean: 9.094049453735352 	 loss mean: 106.62007904052734
nll mean: 97.95709991455078 	 kl mean: 9.094049453735352 	 loss mean: 107.0511474609375
nll mean: 98.3414535522461 	 kl mean: 9.094049453735352 	 loss mean: 107.43550109863281
nll mean: 98.02184295654297 	 kl mean: 9.094049453735352 	 loss mean: 107.11589813232422
nll mean: 98.05168151855469 	 kl mean: 9.094049453735352 	 loss mean: 107.14573669433594


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
100%|██████████| 10/10 [00:00<00:00, 24.16it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A

nll mean: 98.19925689697266 	 kl mean: 9.094049453735352 	 loss mean: 107.29331970214844
nll mean: 137.21868896484375 	 kl mean: 9.4039888381958 	 loss mean: 146.6226806640625
nll mean: 136.6162109375 	 kl mean: 9.4039888381958 	 loss mean: 146.0201873779297


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
 20%|██        | 2/10 [00:00<00:00, 10.83it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.13it/s]
 40%|████      | 4/10 [00:00<00:00, 10.83it/s][A

nll mean: 136.86102294921875 	 kl mean: 9.4039888381958 	 loss mean: 146.26499938964844
nll mean: 137.09793090820312 	 kl mean: 9.4039888381958 	 loss mean: 146.50192260742188
nll mean: 137.1024932861328 	 kl mean: 9.4039888381958 	 loss mean: 146.50648498535156


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s]
 40%|████      | 4/10 [00:00<00:00, 10.83it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.80it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A

nll mean: 136.84735107421875 	 kl mean: 9.4039888381958 	 loss mean: 146.25132751464844
nll mean: 136.56292724609375 	 kl mean: 9.4039888381958 	 loss mean: 145.96693420410156
nll mean: 136.64889526367188 	 kl mean: 9.4039888381958 	 loss mean: 146.05288696289062


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.13it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.72it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.6942901611328 	 kl mean: 9.4039888381958 	 loss mean: 146.09829711914062
nll mean: 137.18511962890625 	 kl mean: 9.4039888381958 	 loss mean: 146.589111328125
nll mean: 123.1854476928711 	 kl mean: 9.351022720336914 	 loss mean: 132.53646850585938


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 13.41it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.54it/s][A

nll mean: 122.81443786621094 	 kl mean: 9.351022720336914 	 loss mean: 132.16546630859375
nll mean: 122.54757690429688 	 kl mean: 9.351022720336914 	 loss mean: 131.89859008789062
nll mean: 123.24394226074219 	 kl mean: 9.351022720336914 	 loss mean: 132.59495544433594


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 40%|████      | 4/10 [00:00<00:00, 13.54it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.62it/s][A

nll mean: 122.567138671875 	 kl mean: 9.351022720336914 	 loss mean: 131.91815185546875
nll mean: 122.63997650146484 	 kl mean: 9.351022720336914 	 loss mean: 131.99099731445312
nll mean: 122.69781494140625 	 kl mean: 9.351022720336914 	 loss mean: 132.04884338378906


                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.62it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.75it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.80it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 122.5604476928711 	 kl mean: 9.351022720336914 	 loss mean: 131.91146850585938
nll mean: 122.59294891357422 	 kl mean: 9.351022720336914 	 loss mean: 131.9439697265625
nll mean: 122.09938049316406 	 kl mean: 9.351022720336914 	 loss mean: 131.45040893554688


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 13.74it/s][A

nll mean: 122.36517333984375 	 kl mean: 9.414244651794434 	 loss mean: 131.7794189453125
nll mean: 122.27925109863281 	 kl mean: 9.414244651794434 	 loss mean: 131.69349670410156
nll mean: 122.46675872802734 	 kl mean: 9.414244651794434 	 loss mean: 131.88099670410156


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 13.74it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 13.78it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.04it/s][A

nll mean: 122.74104309082031 	 kl mean: 9.414244651794434 	 loss mean: 132.15530395507812
nll mean: 122.56986236572266 	 kl mean: 9.414244651794434 	 loss mean: 131.98410034179688
nll mean: 122.33296203613281 	 kl mean: 9.414244651794434 	 loss mean: 131.74720764160156


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.04it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.22it/s][A

nll mean: 122.69654846191406 	 kl mean: 9.414244651794434 	 loss mean: 132.11077880859375
nll mean: 122.14124298095703 	 kl mean: 9.414244651794434 	 loss mean: 131.55548095703125
nll mean: 122.35130310058594 	 kl mean: 9.414244651794434 	 loss mean: 131.76556396484375


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.22it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.14it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.50it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.50it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.50it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 25.11it/s][A

nll mean: 122.23640441894531 	 kl mean: 9.414244651794434 	 loss mean: 131.65065002441406
nll mean: 131.68115234375 	 kl mean: 9.484764099121094 	 loss mean: 141.16592407226562
nll mean: 131.4526824951172 	 kl mean: 9.484764099121094 	 loss mean: 140.93743896484375
nll mean: 131.71804809570312 	 kl mean: 9.484764099121094 	 loss mean: 141.2028045654297
nll mean: 131.70993041992188 	 kl mean: 9.484764099121094 	 loss mean: 141.19467163085938


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 25.11it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.09it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.98it/s][A

nll mean: 131.8128662109375 	 kl mean: 9.484764099121094 	 loss mean: 141.29763793945312
nll mean: 131.50027465820312 	 kl mean: 9.484764099121094 	 loss mean: 140.98504638671875
nll mean: 132.04229736328125 	 kl mean: 9.484764099121094 	 loss mean: 141.52706909179688
nll mean: 131.82574462890625 	 kl mean: 9.484764099121094 	 loss mean: 141.3105010986328
nll mean: 131.3385772705078 	 kl mean: 9.484764099121094 	 loss mean: 140.82334899902344


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 24.87it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.24it/s][A

nll mean: 131.12738037109375 	 kl mean: 9.484764099121094 	 loss mean: 140.61212158203125
nll mean: 103.30503845214844 	 kl mean: 9.3101806640625 	 loss mean: 112.61521911621094
nll mean: 103.3366470336914 	 kl mean: 9.3101806640625 	 loss mean: 112.6468276977539
nll mean: 103.85641479492188 	 kl mean: 9.3101806640625 	 loss mean: 113.16659545898438
nll mean: 103.69279479980469 	 kl mean: 9.3101806640625 	 loss mean: 113.00297546386719


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.24it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.17it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.03it/s][A

nll mean: 103.57106018066406 	 kl mean: 9.3101806640625 	 loss mean: 112.88124084472656
nll mean: 103.69537353515625 	 kl mean: 9.3101806640625 	 loss mean: 113.00555419921875
nll mean: 103.39462280273438 	 kl mean: 9.3101806640625 	 loss mean: 112.70480346679688
nll mean: 103.34986877441406 	 kl mean: 9.3101806640625 	 loss mean: 112.66004943847656
nll mean: 103.34844970703125 	 kl mean: 9.3101806640625 	 loss mean: 112.65863037109375


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
100%|██████████| 10/10 [00:00<00:00, 24.95it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.78it/s][A

nll mean: 103.43898010253906 	 kl mean: 9.3101806640625 	 loss mean: 112.74916076660156
nll mean: 129.50173950195312 	 kl mean: 10.145848274230957 	 loss mean: 139.6475830078125
nll mean: 129.45758056640625 	 kl mean: 10.145848274230957 	 loss mean: 139.6034393310547


                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.78it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 40%|████      | 4/10 [00:00<00:00, 14.80it/s][A

nll mean: 129.5727996826172 	 kl mean: 10.145848274230957 	 loss mean: 139.71865844726562
nll mean: 129.39060974121094 	 kl mean: 10.145848274230957 	 loss mean: 139.53646850585938
nll mean: 129.9352264404297 	 kl mean: 10.145848274230957 	 loss mean: 140.08108520507812


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 40%|████      | 4/10 [00:00<00:00, 14.80it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.64it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.94it/s][A

nll mean: 129.28433227539062 	 kl mean: 10.145848274230957 	 loss mean: 139.43017578125
nll mean: 129.89791870117188 	 kl mean: 10.145848274230957 	 loss mean: 140.04379272460938
nll mean: 129.7630615234375 	 kl mean: 10.145848274230957 	 loss mean: 139.90890502929688
nll mean: 129.60736083984375 	 kl mean: 10.145848274230957 	 loss mean: 139.75320434570312


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.94it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.95it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.16it/s][A

nll mean: 129.23211669921875 	 kl mean: 10.145848274230957 	 loss mean: 139.37796020507812
nll mean: 129.12271118164062 	 kl mean: 9.67122745513916 	 loss mean: 138.7939453125
nll mean: 129.083251953125 	 kl mean: 9.67122745513916 	 loss mean: 138.75448608398438
nll mean: 129.958251953125 	 kl mean: 9.67122745513916 	 loss mean: 139.6294708251953
nll mean: 129.53134155273438 	 kl mean: 9.67122745513916 	 loss mean: 139.2025604248047


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.16it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.55it/s][A

nll mean: 129.49838256835938 	 kl mean: 9.67122745513916 	 loss mean: 139.16958618164062
nll mean: 129.45480346679688 	 kl mean: 9.67122745513916 	 loss mean: 139.12603759765625
nll mean: 129.578369140625 	 kl mean: 9.67122745513916 	 loss mean: 139.24960327148438
nll mean: 128.94064331054688 	 kl mean: 9.67122745513916 	 loss mean: 138.61187744140625
nll mean: 129.0651397705078 	 kl mean: 9.67122745513916 	 loss mean: 138.73635864257812


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.25it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.74it/s][A

nll mean: 129.1322021484375 	 kl mean: 9.67122745513916 	 loss mean: 138.80343627929688
nll mean: 115.34764099121094 	 kl mean: 9.945528030395508 	 loss mean: 125.29315948486328
nll mean: 114.94026184082031 	 kl mean: 9.945528030395508 	 loss mean: 124.88578796386719
nll mean: 115.22038269042969 	 kl mean: 9.945528030395508 	 loss mean: 125.16590881347656
nll mean: 115.43688201904297 	 kl mean: 9.945528030395508 	 loss mean: 125.3824234008789


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.74it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.62it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.58it/s][A

nll mean: 115.45973205566406 	 kl mean: 9.945528030395508 	 loss mean: 125.40525817871094
nll mean: 115.28172302246094 	 kl mean: 9.945528030395508 	 loss mean: 125.22724914550781
nll mean: 115.23111724853516 	 kl mean: 9.945528030395508 	 loss mean: 125.17665100097656
nll mean: 115.5507583618164 	 kl mean: 9.945528030395508 	 loss mean: 125.49629211425781
nll mean: 114.92867279052734 	 kl mean: 9.945528030395508 	 loss mean: 124.87420654296875


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
100%|██████████| 10/10 [00:00<00:00, 24.46it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.31it/s][A

nll mean: 114.92215728759766 	 kl mean: 9.945528030395508 	 loss mean: 124.86767578125
nll mean: 139.50108337402344 	 kl mean: 9.527970314025879 	 loss mean: 149.02903747558594
nll mean: 139.39361572265625 	 kl mean: 9.527970314025879 	 loss mean: 148.92160034179688
nll mean: 139.3109893798828 	 kl mean: 9.527970314025879 	 loss mean: 148.83895874023438
nll mean: 139.58700561523438 	 kl mean: 9.527970314025879 	 loss mean: 149.114990234375


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.31it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.30it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.18it/s][A

nll mean: 140.077880859375 	 kl mean: 9.527970314025879 	 loss mean: 149.60586547851562
nll mean: 139.51805114746094 	 kl mean: 9.527970314025879 	 loss mean: 149.0460205078125
nll mean: 139.8203125 	 kl mean: 9.527970314025879 	 loss mean: 149.34828186035156
nll mean: 139.59349060058594 	 kl mean: 9.527970314025879 	 loss mean: 149.1214599609375
nll mean: 139.80718994140625 	 kl mean: 9.527970314025879 	 loss mean: 149.33514404296875


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
100%|██████████| 10/10 [00:00<00:00, 20.98it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A

nll mean: 139.19461059570312 	 kl mean: 9.527970314025879 	 loss mean: 148.72256469726562
nll mean: 118.35401153564453 	 kl mean: 10.035866737365723 	 loss mean: 128.38987731933594
nll mean: 118.49546813964844 	 kl mean: 10.035866737365723 	 loss mean: 128.53134155273438


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.74it/s][A

nll mean: 118.92897033691406 	 kl mean: 10.035866737365723 	 loss mean: 128.96484375
nll mean: 118.69679260253906 	 kl mean: 10.035866737365723 	 loss mean: 128.73265075683594
nll mean: 118.93782043457031 	 kl mean: 10.035866737365723 	 loss mean: 128.9736785888672


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.74it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.61it/s][A

nll mean: 118.67607879638672 	 kl mean: 10.035866737365723 	 loss mean: 128.71194458007812
nll mean: 118.99138641357422 	 kl mean: 10.035866737365723 	 loss mean: 129.02725219726562
nll mean: 118.98938751220703 	 kl mean: 10.035866737365723 	 loss mean: 129.02525329589844


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.61it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.59it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.406005859375 	 kl mean: 10.035866737365723 	 loss mean: 128.44187927246094
nll mean: 118.31916809082031 	 kl mean: 10.035866737365723 	 loss mean: 128.35504150390625
nll mean: 159.0229949951172 	 kl mean: 10.448759078979492 	 loss mean: 169.47174072265625


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00,  9.89it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.83it/s][A

nll mean: 159.00982666015625 	 kl mean: 10.448759078979492 	 loss mean: 169.45858764648438
nll mean: 158.15673828125 	 kl mean: 10.448759078979492 	 loss mean: 168.60549926757812


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00,  9.83it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 40%|████      | 4/10 [00:00<00:00,  9.81it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.81it/s][A

nll mean: 158.85678100585938 	 kl mean: 10.448759078979492 	 loss mean: 169.3055419921875
nll mean: 159.15121459960938 	 kl mean: 10.448759078979492 	 loss mean: 169.5999755859375


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.81it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.82it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.81it/s][A

nll mean: 158.712646484375 	 kl mean: 10.448759078979492 	 loss mean: 169.16140747070312
nll mean: 158.74566650390625 	 kl mean: 10.448759078979492 	 loss mean: 169.19442749023438


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.81it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.85it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.85it/s][A

nll mean: 158.1653594970703 	 kl mean: 10.448759078979492 	 loss mean: 168.61412048339844
nll mean: 159.299560546875 	 kl mean: 10.448759078979492 	 loss mean: 169.74832153320312


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.85it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.83it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.57it/s][A

nll mean: 159.30197143554688 	 kl mean: 10.448759078979492 	 loss mean: 169.750732421875
nll mean: 133.0669403076172 	 kl mean: 9.316023826599121 	 loss mean: 142.38296508789062
nll mean: 133.14376831054688 	 kl mean: 9.316023826599121 	 loss mean: 142.4597930908203
nll mean: 133.30258178710938 	 kl mean: 9.316023826599121 	 loss mean: 142.6186065673828


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.57it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.31it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.23it/s][A

nll mean: 132.71087646484375 	 kl mean: 9.316023826599121 	 loss mean: 142.0269012451172
nll mean: 133.52011108398438 	 kl mean: 9.316023826599121 	 loss mean: 142.83615112304688
nll mean: 133.39788818359375 	 kl mean: 9.316023826599121 	 loss mean: 142.71392822265625
nll mean: 133.02085876464844 	 kl mean: 9.316023826599121 	 loss mean: 142.33688354492188


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.23it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.95it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.65432739257812 	 kl mean: 9.316023826599121 	 loss mean: 142.97035217285156
nll mean: 133.29519653320312 	 kl mean: 9.316023826599121 	 loss mean: 142.6112060546875
nll mean: 133.24574279785156 	 kl mean: 9.316023826599121 	 loss mean: 142.561767578125


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.48it/s][A

nll mean: 140.33889770507812 	 kl mean: 10.21552848815918 	 loss mean: 150.55442810058594
nll mean: 139.74679565429688 	 kl mean: 10.21552848815918 	 loss mean: 149.96231079101562
nll mean: 140.20045471191406 	 kl mean: 10.21552848815918 	 loss mean: 150.41598510742188


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.48it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A

nll mean: 140.075439453125 	 kl mean: 10.21552848815918 	 loss mean: 150.29098510742188
nll mean: 139.82577514648438 	 kl mean: 10.21552848815918 	 loss mean: 150.04132080078125
nll mean: 139.44924926757812 	 kl mean: 10.21552848815918 	 loss mean: 149.66476440429688


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.60it/s][A

nll mean: 139.99903869628906 	 kl mean: 10.21552848815918 	 loss mean: 150.21456909179688
nll mean: 139.97386169433594 	 kl mean: 10.21552848815918 	 loss mean: 150.18939208984375
nll mean: 139.7352752685547 	 kl mean: 10.21552848815918 	 loss mean: 149.9508056640625


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.60it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.33it/s][A

nll mean: 140.32730102539062 	 kl mean: 10.21552848815918 	 loss mean: 150.54281616210938
nll mean: 143.05722045898438 	 kl mean: 9.300888061523438 	 loss mean: 152.3581085205078
nll mean: 143.7022705078125 	 kl mean: 9.300888061523438 	 loss mean: 153.003173828125
nll mean: 143.73602294921875 	 kl mean: 9.300888061523438 	 loss mean: 153.0369110107422
nll mean: 143.47767639160156 	 kl mean: 9.300888061523438 	 loss mean: 152.778564453125


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.33it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.31it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.36it/s][A

nll mean: 143.5872344970703 	 kl mean: 9.300888061523438 	 loss mean: 152.88812255859375
nll mean: 143.60012817382812 	 kl mean: 9.300888061523438 	 loss mean: 152.90101623535156
nll mean: 143.58273315429688 	 kl mean: 9.300888061523438 	 loss mean: 152.8836212158203
nll mean: 143.780517578125 	 kl mean: 9.300888061523438 	 loss mean: 153.08140563964844
nll mean: 143.28350830078125 	 kl mean: 9.300888061523438 	 loss mean: 152.58438110351562


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 24.35it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A


nll mean: 143.5531463623047 	 kl mean: 9.300888061523438 	 loss mean: 152.85403442382812
nll mean: 131.30360412597656 	 kl mean: 9.548248291015625 	 loss mean: 140.8518524169922
nll mean: 131.26246643066406 	 kl mean: 9.548248291015625 	 loss mean: 140.81072998046875
nll mean: 130.9709014892578 	 kl mean: 9.548248291015625 	 loss mean: 140.51914978027344
nll mean: 131.4334259033203 	 kl mean: 9.548248291015625 	 loss mean: 140.98167419433594


 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 25.24it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.20it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.04it/s][A

nll mean: 130.95591735839844 	 kl mean: 9.548248291015625 	 loss mean: 140.504150390625
nll mean: 131.52786254882812 	 kl mean: 9.548248291015625 	 loss mean: 141.07611083984375
nll mean: 131.18910217285156 	 kl mean: 9.548248291015625 	 loss mean: 140.73733520507812
nll mean: 130.88949584960938 	 kl mean: 9.548248291015625 	 loss mean: 140.43775939941406
nll mean: 131.32566833496094 	 kl mean: 9.548248291015625 	 loss mean: 140.87391662597656


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
100%|██████████| 10/10 [00:00<00:00, 24.93it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.53it/s][A

nll mean: 131.63821411132812 	 kl mean: 9.548248291015625 	 loss mean: 141.18646240234375
nll mean: 128.89971923828125 	 kl mean: 10.109997749328613 	 loss mean: 139.00973510742188
nll mean: 128.5086669921875 	 kl mean: 10.109997749328613 	 loss mean: 138.61865234375


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.53it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A

nll mean: 128.61962890625 	 kl mean: 10.109997749328613 	 loss mean: 138.7296142578125
nll mean: 128.5164337158203 	 kl mean: 10.109997749328613 	 loss mean: 138.62643432617188
nll mean: 128.3275604248047 	 kl mean: 10.109997749328613 	 loss mean: 138.43756103515625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.39it/s][A

nll mean: 128.88543701171875 	 kl mean: 10.109997749328613 	 loss mean: 138.99545288085938
nll mean: 129.28048706054688 	 kl mean: 10.109997749328613 	 loss mean: 139.3905029296875
nll mean: 129.02996826171875 	 kl mean: 10.109997749328613 	 loss mean: 139.13995361328125


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.39it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.35it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.88548278808594 	 kl mean: 10.109997749328613 	 loss mean: 138.9954833984375
nll mean: 128.61868286132812 	 kl mean: 10.109997749328613 	 loss mean: 138.72866821289062
nll mean: 146.21890258789062 	 kl mean: 10.151653289794922 	 loss mean: 156.37054443359375


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 12.63it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.62it/s][A

nll mean: 146.51480102539062 	 kl mean: 10.151653289794922 	 loss mean: 156.6664581298828
nll mean: 145.9268035888672 	 kl mean: 10.151653289794922 	 loss mean: 156.07843017578125
nll mean: 146.1658935546875 	 kl mean: 10.151653289794922 	 loss mean: 156.31753540039062


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 40%|████      | 4/10 [00:00<00:00, 12.62it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A

nll mean: 145.8653564453125 	 kl mean: 10.151653289794922 	 loss mean: 156.0170135498047
nll mean: 146.39306640625 	 kl mean: 10.151653289794922 	 loss mean: 156.54473876953125
nll mean: 146.19107055664062 	 kl mean: 10.151653289794922 	 loss mean: 156.34274291992188


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.44it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 146.9019775390625 	 kl mean: 10.151653289794922 	 loss mean: 157.0536346435547
nll mean: 146.4752197265625 	 kl mean: 10.151653289794922 	 loss mean: 156.6268768310547
nll mean: 146.26812744140625 	 kl mean: 10.151653289794922 	 loss mean: 156.41976928710938


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.65it/s][A

nll mean: 154.22796630859375 	 kl mean: 9.37896728515625 	 loss mean: 163.60693359375
nll mean: 154.3328399658203 	 kl mean: 9.37896728515625 	 loss mean: 163.71182250976562
nll mean: 154.94760131835938 	 kl mean: 9.37896728515625 	 loss mean: 164.32656860351562


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.65it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A

nll mean: 154.64761352539062 	 kl mean: 9.37896728515625 	 loss mean: 164.02658081054688
nll mean: 154.3455810546875 	 kl mean: 9.37896728515625 	 loss mean: 163.72454833984375
nll mean: 154.57293701171875 	 kl mean: 9.37896728515625 	 loss mean: 163.951904296875


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A

nll mean: 154.50689697265625 	 kl mean: 9.37896728515625 	 loss mean: 163.8858642578125
nll mean: 154.84840393066406 	 kl mean: 9.37896728515625 	 loss mean: 164.2273712158203
nll mean: 154.78549194335938 	 kl mean: 9.37896728515625 	 loss mean: 164.16445922851562


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.36it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 154.54981994628906 	 kl mean: 9.37896728515625 	 loss mean: 163.92877197265625
nll mean: 116.43836975097656 	 kl mean: 9.625526428222656 	 loss mean: 126.06388854980469
nll mean: 116.1887435913086 	 kl mean: 9.625526428222656 	 loss mean: 125.81427001953125



                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 10.23it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A

nll mean: 116.29668426513672 	 kl mean: 9.625526428222656 	 loss mean: 125.92221069335938
nll mean: 116.486083984375 	 kl mean: 9.625526428222656 	 loss mean: 126.11161804199219
nll mean: 116.61032104492188 	 kl mean: 9.625526428222656 	 loss mean: 126.23583984375


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.27it/s][A


nll mean: 116.36524963378906 	 kl mean: 9.625526428222656 	 loss mean: 125.99076843261719
nll mean: 116.10711669921875 	 kl mean: 9.625526428222656 	 loss mean: 125.73265075683594
nll mean: 116.33283996582031 	 kl mean: 9.625526428222656 	 loss mean: 125.95835876464844


                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.22it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.26it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.69921112060547 	 kl mean: 9.625526428222656 	 loss mean: 126.32473754882812
nll mean: 116.6547622680664 	 kl mean: 9.625526428222656 	 loss mean: 126.28028869628906
nll mean: 104.13960266113281 	 kl mean: 8.984607696533203 	 loss mean: 113.12420654296875
nll mean: 104.15657806396484 	 kl mean: 8.984607696533203 	 loss mean: 113.14118957519531
nll mean: 103.42743682861328 	 kl mean: 8.984607696533203 	 loss mean: 112.41204833984375


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.18it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
100%|██████████| 10/10 [00:00<00:00, 32.58it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 103.96733093261719 	 kl mean: 8.984607696533203 	 loss mean: 112.95194244384766
nll mean: 104.17025756835938 	 kl mean: 8.984607696533203 	 loss mean: 113.15486145019531
nll mean: 103.87995910644531 	 kl mean: 8.984607696533203 	 loss mean: 112.86456298828125
nll mean: 103.6732177734375 	 kl mean: 8.984607696533203 	 loss mean: 112.65782928466797
nll mean: 103.60220336914062 	 kl mean: 8.984607696533203 	 loss mean: 112.58682250976562
nll mean: 103.397705078125 	 kl mean: 8.984607696533203 	 loss mean: 112.38231658935547
nll mean: 104.05693054199219 	 kl mean: 8.984607696533203 	 loss mean: 113.04153442382812


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.50it/s][A

nll mean: 155.37423706054688 	 kl mean: 9.512740135192871 	 loss mean: 164.88697814941406
nll mean: 154.6153564453125 	 kl mean: 9.512740135192871 	 loss mean: 164.12808227539062
nll mean: 154.6644744873047 	 kl mean: 9.512740135192871 	 loss mean: 164.17721557617188


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.50it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.59it/s][A

nll mean: 155.00204467773438 	 kl mean: 9.512740135192871 	 loss mean: 164.5147705078125
nll mean: 154.89395141601562 	 kl mean: 9.512740135192871 	 loss mean: 164.40670776367188
nll mean: 155.0107879638672 	 kl mean: 9.512740135192871 	 loss mean: 164.52352905273438


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.59it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.65it/s][A

nll mean: 155.23593139648438 	 kl mean: 9.512740135192871 	 loss mean: 164.74867248535156
nll mean: 155.53054809570312 	 kl mean: 9.512740135192871 	 loss mean: 165.04330444335938
nll mean: 155.44699096679688 	 kl mean: 9.512740135192871 	 loss mean: 164.95973205566406


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.67it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A

nll mean: 154.939453125 	 kl mean: 9.512740135192871 	 loss mean: 164.4521942138672
nll mean: 119.67582702636719 	 kl mean: 10.130712509155273 	 loss mean: 129.80653381347656
nll mean: 119.32102966308594 	 kl mean: 10.130712509155273 	 loss mean: 129.4517364501953
nll mean: 119.5146713256836 	 kl mean: 10.130712509155273 	 loss mean: 129.6453857421875
nll mean: 120.1002197265625 	 kl mean: 10.130712509155273 	 loss mean: 130.23092651367188


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.58it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.40it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.40it/s][A

nll mean: 120.08584594726562 	 kl mean: 10.130712509155273 	 loss mean: 130.21656799316406
nll mean: 119.19865417480469 	 kl mean: 10.130712509155273 	 loss mean: 129.32937622070312
nll mean: 119.19015502929688 	 kl mean: 10.130712509155273 	 loss mean: 129.32086181640625
nll mean: 119.76730346679688 	 kl mean: 10.130712509155273 	 loss mean: 129.89801025390625
nll mean: 119.25751495361328 	 kl mean: 10.130712509155273 	 loss mean: 129.3882293701172


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.36it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.46it/s][A

nll mean: 119.85972595214844 	 kl mean: 10.130712509155273 	 loss mean: 129.9904327392578
nll mean: 112.23729705810547 	 kl mean: 9.171380996704102 	 loss mean: 121.40867614746094
nll mean: 112.43536376953125 	 kl mean: 9.171380996704102 	 loss mean: 121.60675048828125


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.46it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.59it/s][A

nll mean: 112.65446472167969 	 kl mean: 9.171380996704102 	 loss mean: 121.82585144042969
nll mean: 112.4522705078125 	 kl mean: 9.171380996704102 	 loss mean: 121.62364196777344
nll mean: 112.34915161132812 	 kl mean: 9.171380996704102 	 loss mean: 121.5205307006836


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.59it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.63it/s][A

nll mean: 112.33406066894531 	 kl mean: 9.171380996704102 	 loss mean: 121.50543975830078
nll mean: 112.19711303710938 	 kl mean: 9.171380996704102 	 loss mean: 121.36849212646484
nll mean: 112.34310913085938 	 kl mean: 9.171380996704102 	 loss mean: 121.51448822021484


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.71it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               

nll mean: 112.0405502319336 	 kl mean: 9.171380996704102 	 loss mean: 121.2119369506836
nll mean: 112.2960205078125 	 kl mean: 9.171380996704102 	 loss mean: 121.46739959716797
nll mean: 80.74639892578125 	 kl mean: 8.287986755371094 	 loss mean: 89.03439331054688
nll mean: 80.88203430175781 	 kl mean: 8.287986755371094 	 loss mean: 89.17002868652344



 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 23.11it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A

nll mean: 80.85247802734375 	 kl mean: 8.287986755371094 	 loss mean: 89.14046478271484
nll mean: 80.46243286132812 	 kl mean: 8.287986755371094 	 loss mean: 88.75042724609375
nll mean: 81.23886108398438 	 kl mean: 8.287986755371094 	 loss mean: 89.52684020996094
nll mean: 80.88064575195312 	 kl mean: 8.287986755371094 	 loss mean: 89.16863250732422
nll mean: 81.27268981933594 	 kl mean: 8.287986755371094 	 loss mean: 89.56068420410156


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.65it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 21.90it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 80.96839904785156 	 kl mean: 8.287986755371094 	 loss mean: 89.25637817382812
nll mean: 81.53379821777344 	 kl mean: 8.287986755371094 	 loss mean: 89.82177734375
nll mean: 80.81794738769531 	 kl mean: 8.287986755371094 	 loss mean: 89.10592651367188
nll mean: 107.58399963378906 	 kl mean: 8.847757339477539 	 loss mean: 116.43175506591797
nll mean: 107.58306884765625 	 kl mean: 8.847757339477539 	 loss mean: 116.43083190917969


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 22.29it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.06it/s][A

nll mean: 106.50938415527344 	 kl mean: 8.847757339477539 	 loss mean: 115.35714721679688
nll mean: 106.7413330078125 	 kl mean: 8.847757339477539 	 loss mean: 115.5890884399414
nll mean: 107.75031280517578 	 kl mean: 8.847757339477539 	 loss mean: 116.59807586669922
nll mean: 107.26021575927734 	 kl mean: 8.847757339477539 	 loss mean: 116.10797119140625
nll mean: 107.04873657226562 	 kl mean: 8.847757339477539 	 loss mean: 115.89649963378906


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.06it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.67it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 107.31327819824219 	 kl mean: 8.847757339477539 	 loss mean: 116.16104125976562
nll mean: 107.40003204345703 	 kl mean: 8.847757339477539 	 loss mean: 116.24779510498047
nll mean: 107.01148986816406 	 kl mean: 8.847757339477539 	 loss mean: 115.8592529296875
nll mean: 118.18856811523438 	 kl mean: 9.741743087768555 	 loss mean: 127.9303207397461


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.19it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.19it/s][A

nll mean: 117.77079772949219 	 kl mean: 9.741743087768555 	 loss mean: 127.51253509521484
nll mean: 118.14246368408203 	 kl mean: 9.741743087768555 	 loss mean: 127.88420867919922
nll mean: 117.72467041015625 	 kl mean: 9.741743087768555 	 loss mean: 127.46641540527344


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.19it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.30it/s][A

nll mean: 117.91049194335938 	 kl mean: 9.741743087768555 	 loss mean: 127.65222930908203
nll mean: 118.12716674804688 	 kl mean: 9.741743087768555 	 loss mean: 127.86891174316406
nll mean: 117.65922546386719 	 kl mean: 9.741743087768555 	 loss mean: 127.40097045898438


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.30it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.33it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.35it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.59944152832031 	 kl mean: 9.741743087768555 	 loss mean: 127.3411865234375
nll mean: 118.07431030273438 	 kl mean: 9.741743087768555 	 loss mean: 127.81605529785156
nll mean: 118.16477966308594 	 kl mean: 9.741743087768555 	 loss mean: 127.90652465820312


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 10%|█         | 1/10 [00:00<00:00,  9.92it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.88it/s][A

nll mean: 60.170684814453125 	 kl mean: 10.109844207763672 	 loss mean: 70.28053283691406
nll mean: 60.79498291015625 	 kl mean: 10.109844207763672 	 loss mean: 70.90483093261719


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00,  9.88it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00,  9.86it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]

nll mean: 60.59486389160156 	 kl mean: 10.109844207763672 	 loss mean: 70.70470428466797
nll mean: 61.30054473876953 	 kl mean: 10.109844207763672 	 loss mean: 71.41038513183594
nll mean: 60.06759262084961 	 kl mean: 10.109844207763672 	 loss mean: 70.17743682861328



                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.90it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A

nll mean: 60.95555114746094 	 kl mean: 10.109844207763672 	 loss mean: 71.06539916992188
nll mean: 60.410484313964844 	 kl mean: 10.109844207763672 	 loss mean: 70.52032470703125


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 80%|████████  | 8/10 [00:01<00:00,  9.91it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.97it/s]

nll mean: 60.213531494140625 	 kl mean: 10.109844207763672 	 loss mean: 70.32337188720703
nll mean: 60.767112731933594 	 kl mean: 10.109844207763672 	 loss mean: 70.87696075439453
nll mean: 60.942115783691406 	 kl mean: 10.109844207763672 	 loss mean: 71.05195617675781


100%|██████████| 10/10 [00:01<00:00,  9.92it/s]
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 12.48it/s][A

nll mean: 102.49176025390625 	 kl mean: 9.401819229125977 	 loss mean: 111.8935775756836
nll mean: 103.80419921875 	 kl mean: 9.401819229125977 	 loss mean: 113.20601654052734
nll mean: 103.14849853515625 	 kl mean: 9.401819229125977 	 loss mean: 112.55032348632812


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 12.48it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.40it/s][A

nll mean: 102.91117858886719 	 kl mean: 9.401819229125977 	 loss mean: 112.31300354003906
nll mean: 102.75314331054688 	 kl mean: 9.401819229125977 	 loss mean: 112.15496826171875
nll mean: 102.57077026367188 	 kl mean: 9.401819229125977 	 loss mean: 111.97259521484375


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.40it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.37it/s][A

nll mean: 103.40902709960938 	 kl mean: 9.401819229125977 	 loss mean: 112.81083679199219
nll mean: 103.00497436523438 	 kl mean: 9.401819229125977 	 loss mean: 112.40679168701172
nll mean: 103.57173156738281 	 kl mean: 9.401819229125977 	 loss mean: 112.97354125976562


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.36it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.31it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.76it/s][A

nll mean: 102.98342895507812 	 kl mean: 9.401819229125977 	 loss mean: 112.38525390625
nll mean: 135.79844665527344 	 kl mean: 10.121156692504883 	 loss mean: 145.9196014404297


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 10%|█         | 1/10 [00:00<00:00,  9.76it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 20%|██        | 2/10 [00:00<00:00,  9.79it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.82it/s][A

nll mean: 136.295166015625 	 kl mean: 10.121156692504883 	 loss mean: 146.41632080078125
nll mean: 135.9950714111328 	 kl mean: 10.121156692504883 	 loss mean: 146.11622619628906


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00,  9.82it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 40%|████      | 4/10 [00:00<00:00,  9.85it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.87it/s][A

nll mean: 135.55413818359375 	 kl mean: 10.121156692504883 	 loss mean: 145.67529296875
nll mean: 135.5453338623047 	 kl mean: 10.121156692504883 	 loss mean: 145.66650390625


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.87it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.86it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.77it/s][A

nll mean: 135.89370727539062 	 kl mean: 10.121156692504883 	 loss mean: 146.0148468017578
nll mean: 135.8791961669922 	 kl mean: 10.121156692504883 	 loss mean: 146.00035095214844


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.77it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.31it/s]
                                               [A
 82%|████████▏ | 31/38 [00:21<00:05,  1.31it/s]
 80%|████████  | 8/10 [00:01<00:00,  9.82it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A

nll mean: 136.02389526367188 	 kl mean: 10.121156692504883 	 loss mean: 146.14505004882812
nll mean: 135.4920654296875 	 kl mean: 10.121156692504883 	 loss mean: 145.61322021484375
nll mean: 135.6082763671875 	 kl mean: 10.121156692504883 	 loss mean: 145.72943115234375


100%|██████████| 10/10 [00:01<00:00,  9.87it/s]
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
 30%|███       | 3/10 [00:00<00:00, 26.49it/s][A
 60%|██████    | 6/10 [00:00<00:00, 26.14it/s][A

nll mean: 62.462955474853516 	 kl mean: 8.487539291381836 	 loss mean: 70.95049285888672
nll mean: 62.39569091796875 	 kl mean: 8.487539291381836 	 loss mean: 70.88323211669922
nll mean: 62.55387878417969 	 kl mean: 8.487539291381836 	 loss mean: 71.04141235351562
nll mean: 62.64335632324219 	 kl mean: 8.487539291381836 	 loss mean: 71.13088989257812
nll mean: 62.50617980957031 	 kl mean: 8.487539291381836 	 loss mean: 70.99371337890625
nll mean: 62.937828063964844 	 kl mean: 8.487539291381836 	 loss mean: 71.42536926269531


                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.14it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.19it/s]
100%|██████████| 10/10 [00:00<00:00, 25.68it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 62.708465576171875 	 kl mean: 8.487539291381836 	 loss mean: 71.19599914550781
nll mean: 62.84775161743164 	 kl mean: 8.487539291381836 	 loss mean: 71.33528137207031
nll mean: 62.59466552734375 	 kl mean: 8.487539291381836 	 loss mean: 71.08219909667969
nll mean: 62.53042221069336 	 kl mean: 8.487539291381836 	 loss mean: 71.01795959472656
nll mean: 116.48701477050781 	 kl mean: 8.868452072143555 	 loss mean: 125.35546875


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.53it/s][A

nll mean: 116.4332046508789 	 kl mean: 8.868452072143555 	 loss mean: 125.30166625976562
nll mean: 116.34854888916016 	 kl mean: 8.868452072143555 	 loss mean: 125.21699523925781
nll mean: 117.082763671875 	 kl mean: 8.868452072143555 	 loss mean: 125.95121002197266
nll mean: 116.43302154541016 	 kl mean: 8.868452072143555 	 loss mean: 125.30146789550781
nll mean: 116.47071838378906 	 kl mean: 8.868452072143555 	 loss mean: 125.33917236328125


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.53it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
100%|██████████| 10/10 [00:00<00:00, 21.42it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.22579956054688 	 kl mean: 8.868452072143555 	 loss mean: 125.09424591064453
nll mean: 116.46682739257812 	 kl mean: 8.868452072143555 	 loss mean: 125.33528137207031
nll mean: 116.78167724609375 	 kl mean: 8.868452072143555 	 loss mean: 125.65013122558594
nll mean: 116.94884490966797 	 kl mean: 8.868452072143555 	 loss mean: 125.81729888916016


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.08it/s][A

nll mean: 118.43811798095703 	 kl mean: 9.720561981201172 	 loss mean: 128.15867614746094
nll mean: 119.11678314208984 	 kl mean: 9.720561981201172 	 loss mean: 128.83734130859375
nll mean: 118.69059753417969 	 kl mean: 9.720561981201172 	 loss mean: 128.41116333007812


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.08it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.24it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.35it/s][A

nll mean: 118.42364501953125 	 kl mean: 9.720561981201172 	 loss mean: 128.1442108154297
nll mean: 118.3932113647461 	 kl mean: 9.720561981201172 	 loss mean: 128.11378479003906
nll mean: 118.97564697265625 	 kl mean: 9.720561981201172 	 loss mean: 128.6962127685547


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.35it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A

nll mean: 119.15348815917969 	 kl mean: 9.720561981201172 	 loss mean: 128.87405395507812
nll mean: 118.98582458496094 	 kl mean: 9.720561981201172 	 loss mean: 128.7063751220703
nll mean: 118.95968627929688 	 kl mean: 9.720561981201172 	 loss mean: 128.6802520751953


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.49it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.51it/s][A

nll mean: 118.4013442993164 	 kl mean: 9.720561981201172 	 loss mean: 128.1219024658203
nll mean: 112.63090515136719 	 kl mean: 9.061546325683594 	 loss mean: 121.69245147705078
nll mean: 112.47714233398438 	 kl mean: 9.061546325683594 	 loss mean: 121.53868865966797


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.51it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.51it/s][A

nll mean: 111.60496520996094 	 kl mean: 9.061546325683594 	 loss mean: 120.66651153564453
nll mean: 112.15078735351562 	 kl mean: 9.061546325683594 	 loss mean: 121.21233367919922
nll mean: 112.0460205078125 	 kl mean: 9.061546325683594 	 loss mean: 121.1075668334961


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.51it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.52it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.53it/s][A

nll mean: 112.10386657714844 	 kl mean: 9.061546325683594 	 loss mean: 121.16541290283203
nll mean: 112.68186950683594 	 kl mean: 9.061546325683594 	 loss mean: 121.74341583251953
nll mean: 112.6246337890625 	 kl mean: 9.061546325683594 	 loss mean: 121.68618774414062


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.53it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.53it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.37266540527344 	 kl mean: 9.061546325683594 	 loss mean: 121.43421173095703
nll mean: 112.4144515991211 	 kl mean: 9.061546325683594 	 loss mean: 121.47599792480469
nll mean: 109.7215805053711 	 kl mean: 9.318066596984863 	 loss mean: 119.03964233398438
nll mean: 109.74193572998047 	 kl mean: 9.318066596984863 	 loss mean: 119.05999755859375


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.16it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.20it/s][A

nll mean: 109.50791931152344 	 kl mean: 9.318066596984863 	 loss mean: 118.82598114013672
nll mean: 109.93540954589844 	 kl mean: 9.318066596984863 	 loss mean: 119.25347900390625
nll mean: 110.17391204833984 	 kl mean: 9.318066596984863 	 loss mean: 119.49197387695312
nll mean: 110.32460021972656 	 kl mean: 9.318066596984863 	 loss mean: 119.64266967773438
nll mean: 110.5469970703125 	 kl mean: 9.318066596984863 	 loss mean: 119.86505889892578


                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.20it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 21.37it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.3216552734375 	 kl mean: 9.318066596984863 	 loss mean: 119.63971710205078
nll mean: 109.59703063964844 	 kl mean: 9.318066596984863 	 loss mean: 118.91509246826172
nll mean: 110.32003021240234 	 kl mean: 9.318066596984863 	 loss mean: 119.63809204101562
nll mean: 84.22257995605469 	 kl mean: 10.216300964355469 	 loss mean: 94.4388656616211
nll mean: 84.44380187988281 	 kl mean: 10.216300964355469 	 loss mean: 94.66009521484375
nll mean: 83.63551330566406 	 kl mean: 10.216300964355469 	 loss mean: 93.851806640625


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.44it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 30.57it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 83.9374771118164 	 kl mean: 10.216300964355469 	 loss mean: 94.15377807617188
nll mean: 83.77699279785156 	 kl mean: 10.216300964355469 	 loss mean: 93.9932861328125
nll mean: 84.28195190429688 	 kl mean: 10.216300964355469 	 loss mean: 94.49825286865234
nll mean: 84.32229614257812 	 kl mean: 10.216300964355469 	 loss mean: 94.5385971069336
nll mean: 83.22136688232422 	 kl mean: 10.216300964355469 	 loss mean: 93.43766784667969
nll mean: 83.55787658691406 	 kl mean: 10.216300964355469 	 loss mean: 93.774169921875
nll mean: 83.73751068115234 	 kl mean: 10.216300964355469 	 loss mean: 93.95381927490234
Approximate NLL:
tensor(119.5421, device='cuda:0')
Approximate KL:
tensor(9.5691, device='cuda:0')
Testing took 0:00:25.403366


In [19]:
# Show the approximate NLL estimates collected in `mdr_nlls`.
# NOTE(review): presumably one entry per checkpoint, as returned by
# get_approx_nlls; the assignment is in an earlier cell, so confirm there.
print(mdr_nlls)

[tensor(119.7677, device='cuda:0'), tensor(119.8687, device='cuda:0'), tensor(120.0548, device='cuda:0'), tensor(119.5421, device='cuda:0')]


# Word dropout & Free Bits

In [20]:
# Gather one checkpoint path per results directory (results0..results3) for
# the 'word_dropout_066_freebits_05' experiment; the helper picks the first
# entry it finds in each run's models/ folder.
saved_model_files = get_model_filenames(
    experiment_name='word_dropout_066_freebits_05',
)
# Bare last expression so the notebook displays the resolved paths.
saved_model_files

['results_final/results0/word_dropout_066_freebits_05/models/sentence_vae_FreeBits_0.5_4500.pt',
 'results_final/results1/word_dropout_066_freebits_05/models/sentence_vae_FreeBits_0.5_6000.pt',
 'results_final/results2/word_dropout_066_freebits_05/models/sentence_vae_FreeBits_0.5_6000.pt',
 'results_final/results3/word_dropout_066_freebits_05/models/sentence_vae_FreeBits_0.5_7000.pt']

In [21]:
# Evaluate every checkpoint listed above: get_approx_nlls calls
# test_nll_estimation once per file and returns two parallel lists,
# the NLL values and the KL values.
wd_fb_nlls, wd_fb_kls = get_approx_nlls(
    saved_model_files=saved_model_files,
)

  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .63it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .63it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.63it/s][A

nll mean: 109.65031433105469 	 kl mean: 9.060304641723633 	 loss mean: 118.71061706542969
nll mean: 109.71214294433594 	 kl mean: 9.060304641723633 	 loss mean: 118.77245330810547
nll mean: 109.27368927001953 	 kl mean: 9.060304641723633 	 loss mean: 118.33399963378906
nll mean: 109.56234741210938 	 kl mean: 9.060304641723633 	 loss mean: 118.6226577758789
nll mean: 109.4615707397461 	 kl mean: 9.060304641723633 	 loss mean: 118.52188110351562


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.63it/s][A
                                      .35it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .35it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .35it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.35it/s][A
                                      .12it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 24.90it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.34209442138672 	 kl mean: 9.060304641723633 	 loss mean: 118.40240478515625
nll mean: 110.34087371826172 	 kl mean: 9.060304641723633 	 loss mean: 119.40116882324219
nll mean: 110.13851928710938 	 kl mean: 9.060304641723633 	 loss mean: 119.19882202148438
nll mean: 109.74661254882812 	 kl mean: 9.060304641723633 	 loss mean: 118.80691528320312
nll mean: 109.78779602050781 	 kl mean: 9.060304641723633 	 loss mean: 118.84811401367188


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 20%|██        | 2/10 [00:00<00:00, 13.29it/s][A

nll mean: 127.0489501953125 	 kl mean: 8.866565704345703 	 loss mean: 135.91552734375
nll mean: 126.62678527832031 	 kl mean: 8.866565704345703 	 loss mean: 135.49334716796875
nll mean: 127.33262634277344 	 kl mean: 8.866565704345703 	 loss mean: 136.19918823242188


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 20%|██        | 2/10 [00:00<00:00, 13.29it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 40%|████      | 4/10 [00:00<00:00, 13.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.86it/s][A

nll mean: 127.48977661132812 	 kl mean: 8.866565704345703 	 loss mean: 136.35635375976562
nll mean: 126.95492553710938 	 kl mean: 8.866565704345703 	 loss mean: 135.82150268554688
nll mean: 127.76414489746094 	 kl mean: 8.866565704345703 	 loss mean: 136.63070678710938


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.86it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.90it/s][A

nll mean: 127.01155853271484 	 kl mean: 8.866565704345703 	 loss mean: 135.8781280517578
nll mean: 127.23216247558594 	 kl mean: 8.866565704345703 	 loss mean: 136.09872436523438
nll mean: 127.66414642333984 	 kl mean: 8.866565704345703 	 loss mean: 136.53070068359375


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.90it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.15it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 24.44it/s][A

nll mean: 127.07752990722656 	 kl mean: 8.866565704345703 	 loss mean: 135.944091796875
nll mean: 99.23391723632812 	 kl mean: 8.433399200439453 	 loss mean: 107.66732025146484
nll mean: 99.888671875 	 kl mean: 8.433399200439453 	 loss mean: 108.32207489013672
nll mean: 99.75325012207031 	 kl mean: 8.433399200439453 	 loss mean: 108.1866455078125
nll mean: 99.91557312011719 	 kl mean: 8.433399200439453 	 loss mean: 108.34896850585938


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 24.44it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.43it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.27it/s][A

nll mean: 99.77726745605469 	 kl mean: 8.433399200439453 	 loss mean: 108.21067810058594
nll mean: 99.60249328613281 	 kl mean: 8.433399200439453 	 loss mean: 108.03590393066406
nll mean: 99.52083587646484 	 kl mean: 8.433399200439453 	 loss mean: 107.95423889160156
nll mean: 99.6619644165039 	 kl mean: 8.433399200439453 	 loss mean: 108.0953598022461
nll mean: 99.55589294433594 	 kl mean: 8.433399200439453 	 loss mean: 107.98928833007812


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
100%|██████████| 10/10 [00:00<00:00, 24.28it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A

nll mean: 99.71133422851562 	 kl mean: 8.433399200439453 	 loss mean: 108.14472961425781
nll mean: 139.82785034179688 	 kl mean: 8.302433967590332 	 loss mean: 148.13027954101562
nll mean: 139.52099609375 	 kl mean: 8.302433967590332 	 loss mean: 147.82342529296875


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.82it/s][A

nll mean: 139.6184539794922 	 kl mean: 8.302433967590332 	 loss mean: 147.92088317871094
nll mean: 139.58444213867188 	 kl mean: 8.302433967590332 	 loss mean: 147.88687133789062
nll mean: 139.83349609375 	 kl mean: 8.302433967590332 	 loss mean: 148.13592529296875


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.82it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.82it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A

nll mean: 139.49252319335938 	 kl mean: 8.302433967590332 	 loss mean: 147.79495239257812
nll mean: 139.618408203125 	 kl mean: 8.302433967590332 	 loss mean: 147.9208526611328
nll mean: 139.59561157226562 	 kl mean: 8.302433967590332 	 loss mean: 147.8980712890625


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.82it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.8710174560547 	 kl mean: 8.302433967590332 	 loss mean: 148.17344665527344
nll mean: 139.7892608642578 	 kl mean: 8.302433967590332 	 loss mean: 148.09170532226562
nll mean: 125.80535888671875 	 kl mean: 8.149118423461914 	 loss mean: 133.95448303222656


                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.43it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.47it/s][A

nll mean: 126.03449249267578 	 kl mean: 8.149118423461914 	 loss mean: 134.18360900878906
nll mean: 125.82156372070312 	 kl mean: 8.149118423461914 	 loss mean: 133.97068786621094
nll mean: 125.17552947998047 	 kl mean: 8.149118423461914 	 loss mean: 133.32464599609375


                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.47it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.29it/s][A

nll mean: 126.48310089111328 	 kl mean: 8.149118423461914 	 loss mean: 134.63221740722656
nll mean: 125.50846099853516 	 kl mean: 8.149118423461914 	 loss mean: 133.65757751464844
nll mean: 125.61861419677734 	 kl mean: 8.149118423461914 	 loss mean: 133.76773071289062


                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.29it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.21it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.83395385742188 	 kl mean: 8.149118423461914 	 loss mean: 133.98306274414062
nll mean: 125.89393615722656 	 kl mean: 8.149118423461914 	 loss mean: 134.04302978515625
nll mean: 126.14138793945312 	 kl mean: 8.149118423461914 	 loss mean: 134.29049682617188


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.76it/s][A

nll mean: 123.30656433105469 	 kl mean: 8.1809720993042 	 loss mean: 131.48753356933594
nll mean: 123.38065338134766 	 kl mean: 8.1809720993042 	 loss mean: 131.56161499023438
nll mean: 123.28800964355469 	 kl mean: 8.1809720993042 	 loss mean: 131.46896362304688


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.76it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 40%|████      | 4/10 [00:00<00:00, 14.58it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.41it/s][A

nll mean: 123.50597381591797 	 kl mean: 8.1809720993042 	 loss mean: 131.68695068359375
nll mean: 123.37640380859375 	 kl mean: 8.1809720993042 	 loss mean: 131.557373046875
nll mean: 123.45170593261719 	 kl mean: 8.1809720993042 	 loss mean: 131.63267517089844


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.41it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.21it/s][A

nll mean: 123.15696716308594 	 kl mean: 8.1809720993042 	 loss mean: 131.3379364013672
nll mean: 123.47340393066406 	 kl mean: 8.1809720993042 	 loss mean: 131.6543731689453
nll mean: 123.52770233154297 	 kl mean: 8.1809720993042 	 loss mean: 131.70867919921875


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.21it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.11it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 24.67it/s][A

nll mean: 123.35198974609375 	 kl mean: 8.1809720993042 	 loss mean: 131.532958984375
nll mean: 133.47384643554688 	 kl mean: 8.186443328857422 	 loss mean: 141.6602783203125
nll mean: 134.1564178466797 	 kl mean: 8.186443328857422 	 loss mean: 142.34286499023438
nll mean: 134.26348876953125 	 kl mean: 8.186443328857422 	 loss mean: 142.44992065429688
nll mean: 133.10592651367188 	 kl mean: 8.186443328857422 	 loss mean: 141.29238891601562


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 30%|███       | 3/10 [00:00<00:00, 24.67it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.73it/s][A

nll mean: 133.9973907470703 	 kl mean: 8.186443328857422 	 loss mean: 142.18382263183594
nll mean: 133.85438537597656 	 kl mean: 8.186443328857422 	 loss mean: 142.0408172607422
nll mean: 133.56317138671875 	 kl mean: 8.186443328857422 	 loss mean: 141.74960327148438
nll mean: 133.772216796875 	 kl mean: 8.186443328857422 	 loss mean: 141.95864868164062
nll mean: 133.5289306640625 	 kl mean: 8.186443328857422 	 loss mean: 141.71536254882812


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.52it/s]
100%|██████████| 10/10 [00:00<00:00, 24.74it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A

nll mean: 134.02224731445312 	 kl mean: 8.186443328857422 	 loss mean: 142.20867919921875
nll mean: 107.38987731933594 	 kl mean: 8.098248481750488 	 loss mean: 115.48812866210938
nll mean: 106.85624694824219 	 kl mean: 8.098248481750488 	 loss mean: 114.9544906616211
nll mean: 106.6228256225586 	 kl mean: 8.098248481750488 	 loss mean: 114.7210693359375
nll mean: 107.12289428710938 	 kl mean: 8.098248481750488 	 loss mean: 115.22113800048828


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.92it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.83it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.77it/s][A

nll mean: 106.95870208740234 	 kl mean: 8.098248481750488 	 loss mean: 115.05695343017578
nll mean: 106.42789459228516 	 kl mean: 8.098248481750488 	 loss mean: 114.5261459350586
nll mean: 106.87117767333984 	 kl mean: 8.098248481750488 	 loss mean: 114.96942901611328
nll mean: 106.98696899414062 	 kl mean: 8.098248481750488 	 loss mean: 115.085205078125
nll mean: 107.42402648925781 	 kl mean: 8.098248481750488 	 loss mean: 115.52227783203125


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
100%|██████████| 10/10 [00:00<00:00, 24.70it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.15it/s][A

nll mean: 107.5251693725586 	 kl mean: 8.098248481750488 	 loss mean: 115.62342071533203
nll mean: 132.62063598632812 	 kl mean: 8.698883056640625 	 loss mean: 141.31951904296875
nll mean: 132.45193481445312 	 kl mean: 8.698883056640625 	 loss mean: 141.15081787109375


                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.15it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.76it/s][A

nll mean: 133.29922485351562 	 kl mean: 8.698883056640625 	 loss mean: 141.99810791015625
nll mean: 132.87271118164062 	 kl mean: 8.698883056640625 	 loss mean: 141.57159423828125
nll mean: 132.13186645507812 	 kl mean: 8.698883056640625 	 loss mean: 140.83074951171875
nll mean: 132.99366760253906 	 kl mean: 8.698883056640625 	 loss mean: 141.6925506591797


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.76it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.44it/s][A

nll mean: 132.26983642578125 	 kl mean: 8.698883056640625 	 loss mean: 140.96871948242188
nll mean: 132.36746215820312 	 kl mean: 8.698883056640625 	 loss mean: 141.06634521484375
nll mean: 132.9031524658203 	 kl mean: 8.698883056640625 	 loss mean: 141.60202026367188


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.44it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.75it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.31it/s][A

nll mean: 132.4739532470703 	 kl mean: 8.698883056640625 	 loss mean: 141.17283630371094
nll mean: 132.26092529296875 	 kl mean: 8.520872116088867 	 loss mean: 140.7818145751953
nll mean: 132.14523315429688 	 kl mean: 8.520872116088867 	 loss mean: 140.6660919189453
nll mean: 132.70396423339844 	 kl mean: 8.520872116088867 	 loss mean: 141.22483825683594
nll mean: 132.41976928710938 	 kl mean: 8.520872116088867 	 loss mean: 140.9406280517578


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 22.31it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.86it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.64it/s][A

nll mean: 132.26023864746094 	 kl mean: 8.520872116088867 	 loss mean: 140.78111267089844
nll mean: 131.94715881347656 	 kl mean: 8.520872116088867 	 loss mean: 140.46803283691406
nll mean: 132.532958984375 	 kl mean: 8.520872116088867 	 loss mean: 141.0538330078125
nll mean: 132.68789672851562 	 kl mean: 8.520872116088867 	 loss mean: 141.20877075195312
nll mean: 131.76681518554688 	 kl mean: 8.520872116088867 	 loss mean: 140.2876739501953


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.27it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.89it/s][A

nll mean: 132.54983520507812 	 kl mean: 8.520872116088867 	 loss mean: 141.07070922851562
nll mean: 120.08639526367188 	 kl mean: 8.601173400878906 	 loss mean: 128.68756103515625
nll mean: 120.56644439697266 	 kl mean: 8.601173400878906 	 loss mean: 129.16763305664062
nll mean: 120.37833404541016 	 kl mean: 8.601173400878906 	 loss mean: 128.97952270507812
nll mean: 120.41221618652344 	 kl mean: 8.601173400878906 	 loss mean: 129.0133819580078


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.89it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.76it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.49it/s][A

nll mean: 120.66726684570312 	 kl mean: 8.601173400878906 	 loss mean: 129.2684326171875
nll mean: 120.76437377929688 	 kl mean: 8.601173400878906 	 loss mean: 129.3655548095703
nll mean: 120.71536254882812 	 kl mean: 8.601173400878906 	 loss mean: 129.31654357910156
nll mean: 120.01502227783203 	 kl mean: 8.601173400878906 	 loss mean: 128.6162109375
nll mean: 120.19759368896484 	 kl mean: 8.601173400878906 	 loss mean: 128.79876708984375


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
100%|██████████| 10/10 [00:00<00:00, 24.05it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 30%|███       | 3/10 [00:00<00:00, 20.98it/s][A

nll mean: 120.76213073730469 	 kl mean: 8.601173400878906 	 loss mean: 129.36329650878906
nll mean: 143.37753295898438 	 kl mean: 8.733118057250977 	 loss mean: 152.11065673828125
nll mean: 142.634033203125 	 kl mean: 8.733118057250977 	 loss mean: 151.36715698242188
nll mean: 142.4202880859375 	 kl mean: 8.733118057250977 	 loss mean: 151.15341186523438
nll mean: 142.7081756591797 	 kl mean: 8.733118057250977 	 loss mean: 151.44129943847656


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 30%|███       | 3/10 [00:00<00:00, 20.98it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.16it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.04it/s][A

nll mean: 142.67831420898438 	 kl mean: 8.733118057250977 	 loss mean: 151.41140747070312
nll mean: 142.80722045898438 	 kl mean: 8.733118057250977 	 loss mean: 151.54034423828125
nll mean: 142.3827362060547 	 kl mean: 8.733118057250977 	 loss mean: 151.1158447265625
nll mean: 143.2147674560547 	 kl mean: 8.733118057250977 	 loss mean: 151.94789123535156
nll mean: 142.51040649414062 	 kl mean: 8.733118057250977 	 loss mean: 151.24351501464844


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
100%|██████████| 10/10 [00:00<00:00, 21.11it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.77it/s][A

nll mean: 142.78648376464844 	 kl mean: 8.733118057250977 	 loss mean: 151.5196075439453
nll mean: 120.3409423828125 	 kl mean: 9.070718765258789 	 loss mean: 129.4116668701172
nll mean: 120.98707580566406 	 kl mean: 9.070718765258789 	 loss mean: 130.0577850341797


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 20%|██        | 2/10 [00:00<00:00, 12.77it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 40%|████      | 4/10 [00:00<00:00, 12.78it/s][A

nll mean: 120.35831451416016 	 kl mean: 9.070718765258789 	 loss mean: 129.42904663085938
nll mean: 120.04310607910156 	 kl mean: 9.070718765258789 	 loss mean: 129.11383056640625
nll mean: 120.33183288574219 	 kl mean: 9.070718765258789 	 loss mean: 129.40255737304688


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 40%|████      | 4/10 [00:00<00:00, 12.78it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A

nll mean: 120.29354858398438 	 kl mean: 9.070718765258789 	 loss mean: 129.36427307128906
nll mean: 120.23042297363281 	 kl mean: 9.070718765258789 	 loss mean: 129.3011474609375
nll mean: 120.01370239257812 	 kl mean: 9.070718765258789 	 loss mean: 129.0844268798828


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.05736541748047 	 kl mean: 9.070718765258789 	 loss mean: 129.12808227539062
nll mean: 120.50225830078125 	 kl mean: 9.070718765258789 	 loss mean: 129.57296752929688
nll mean: 160.40771484375 	 kl mean: 9.072799682617188 	 loss mean: 169.4805145263672


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               [A
                                              

nll mean: 160.54002380371094 	 kl mean: 9.072799682617188 	 loss mean: 169.61282348632812
nll mean: 160.95358276367188 	 kl mean: 9.072799682617188 	 loss mean: 170.0263671875


 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00,  9.86it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.87it/s][A

nll mean: 160.61199951171875 	 kl mean: 9.072799682617188 	 loss mean: 169.684814453125
nll mean: 160.49038696289062 	 kl mean: 9.072799682617188 	 loss mean: 169.5631866455078


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.87it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.83it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.86it/s][A

nll mean: 160.7002716064453 	 kl mean: 9.072799682617188 	 loss mean: 169.7730712890625
nll mean: 161.0149383544922 	 kl mean: 9.072799682617188 	 loss mean: 170.08773803710938
nll mean: 161.117919921875 	 kl mean: 9.072799682617188 	 loss mean: 170.19070434570312


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.86it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.91it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.89it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 161.72882080078125 	 kl mean: 9.072799682617188 	 loss mean: 170.80160522460938
nll mean: 161.09719848632812 	 kl mean: 9.072799682617188 	 loss mean: 170.17001342773438
nll mean: 135.14215087890625 	 kl mean: 8.038087844848633 	 loss mean: 143.18023681640625


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 17.77it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.65it/s][A

nll mean: 135.65248107910156 	 kl mean: 8.038087844848633 	 loss mean: 143.69058227539062
nll mean: 135.5816650390625 	 kl mean: 8.038087844848633 	 loss mean: 143.61976623535156
nll mean: 135.5567626953125 	 kl mean: 8.038087844848633 	 loss mean: 143.5948486328125
nll mean: 135.47073364257812 	 kl mean: 8.038087844848633 	 loss mean: 143.50881958007812


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.65it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.58it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.49it/s][A

nll mean: 136.03021240234375 	 kl mean: 8.038087844848633 	 loss mean: 144.06829833984375
nll mean: 135.47366333007812 	 kl mean: 8.038087844848633 	 loss mean: 143.51174926757812
nll mean: 135.41525268554688 	 kl mean: 8.038087844848633 	 loss mean: 143.45333862304688
nll mean: 135.41839599609375 	 kl mean: 8.038087844848633 	 loss mean: 143.45648193359375


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.49it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.45it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.49it/s][A

nll mean: 135.3960418701172 	 kl mean: 8.038087844848633 	 loss mean: 143.4341278076172
nll mean: 143.1465301513672 	 kl mean: 8.635129928588867 	 loss mean: 151.7816619873047
nll mean: 143.62069702148438 	 kl mean: 8.635129928588867 	 loss mean: 152.2558135986328


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.49it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.58it/s][A

nll mean: 143.0992431640625 	 kl mean: 8.635129928588867 	 loss mean: 151.734375
nll mean: 142.32763671875 	 kl mean: 8.635129928588867 	 loss mean: 150.9627685546875
nll mean: 142.91482543945312 	 kl mean: 8.635129928588867 	 loss mean: 151.54995727539062


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.58it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.67it/s][A

nll mean: 142.57469177246094 	 kl mean: 8.635129928588867 	 loss mean: 151.20982360839844
nll mean: 142.98399353027344 	 kl mean: 8.635129928588867 	 loss mean: 151.61912536621094
nll mean: 142.75772094726562 	 kl mean: 8.635129928588867 	 loss mean: 151.39283752441406


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.66it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 142.49191284179688 	 kl mean: 8.635129928588867 	 loss mean: 151.12704467773438
nll mean: 142.8660430908203 	 kl mean: 8.635129928588867 	 loss mean: 151.5011749267578
nll mean: 144.3892822265625 	 kl mean: 7.6593523025512695 	 loss mean: 152.04861450195312
nll mean: 144.22447204589844 	 kl mean: 7.6593523025512695 	 loss mean: 151.88381958007812


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.56it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.52it/s][A

nll mean: 144.78060913085938 	 kl mean: 7.6593523025512695 	 loss mean: 152.43997192382812
nll mean: 144.73770141601562 	 kl mean: 7.6593523025512695 	 loss mean: 152.3970489501953
nll mean: 144.6087646484375 	 kl mean: 7.6593523025512695 	 loss mean: 152.2681121826172
nll mean: 144.5121612548828 	 kl mean: 7.6593523025512695 	 loss mean: 152.1715087890625
nll mean: 144.2200164794922 	 kl mean: 7.6593523025512695 	 loss mean: 151.87936401367188


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.52it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 24.49it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.06655883789062 	 kl mean: 7.6593523025512695 	 loss mean: 151.72592163085938
nll mean: 145.00575256347656 	 kl mean: 7.6593523025512695 	 loss mean: 152.66510009765625
nll mean: 144.203857421875 	 kl mean: 7.6593523025512695 	 loss mean: 151.86322021484375
nll mean: 133.80943298339844 	 kl mean: 8.208298683166504 	 loss mean: 142.01773071289062
nll mean: 133.87155151367188 	 kl mean: 8.208298683166504 	 loss mean: 142.07986450195312


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.83it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.82it/s][A

nll mean: 133.30076599121094 	 kl mean: 8.208298683166504 	 loss mean: 141.50904846191406
nll mean: 133.46054077148438 	 kl mean: 8.208298683166504 	 loss mean: 141.66885375976562
nll mean: 133.7640380859375 	 kl mean: 8.208298683166504 	 loss mean: 141.97235107421875
nll mean: 133.52056884765625 	 kl mean: 8.208298683166504 	 loss mean: 141.72886657714844
nll mean: 133.88575744628906 	 kl mean: 8.208298683166504 	 loss mean: 142.09405517578125


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.82it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
100%|██████████| 10/10 [00:00<00:00, 24.60it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.296875 	 kl mean: 8.208298683166504 	 loss mean: 141.50518798828125
nll mean: 134.1588134765625 	 kl mean: 8.208298683166504 	 loss mean: 142.36709594726562
nll mean: 133.5968017578125 	 kl mean: 8.208298683166504 	 loss mean: 141.80511474609375
nll mean: 130.03489685058594 	 kl mean: 9.11074447631836 	 loss mean: 139.14564514160156


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.00it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.11it/s][A

nll mean: 130.95590209960938 	 kl mean: 9.11074447631836 	 loss mean: 140.06663513183594
nll mean: 130.52102661132812 	 kl mean: 9.11074447631836 	 loss mean: 139.63177490234375
nll mean: 130.23728942871094 	 kl mean: 9.11074447631836 	 loss mean: 139.34803771972656


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 40%|████      | 4/10 [00:00<00:00, 12.11it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.26it/s][A

nll mean: 130.36082458496094 	 kl mean: 9.11074447631836 	 loss mean: 139.4715576171875
nll mean: 129.98101806640625 	 kl mean: 9.11074447631836 	 loss mean: 139.09176635742188
nll mean: 129.87367248535156 	 kl mean: 9.11074447631836 	 loss mean: 138.9844207763672


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.26it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.42it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.52it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.0504150390625 	 kl mean: 9.11074447631836 	 loss mean: 139.16116333007812
nll mean: 130.11727905273438 	 kl mean: 9.11074447631836 	 loss mean: 139.22801208496094
nll mean: 130.095458984375 	 kl mean: 9.11074447631836 	 loss mean: 139.20619201660156


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.79it/s][A

nll mean: 147.71347045898438 	 kl mean: 8.750589370727539 	 loss mean: 156.46408081054688
nll mean: 148.52928161621094 	 kl mean: 8.750589370727539 	 loss mean: 157.27987670898438
nll mean: 148.16250610351562 	 kl mean: 8.750589370727539 	 loss mean: 156.91310119628906


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.79it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 12.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A

nll mean: 148.53271484375 	 kl mean: 8.750589370727539 	 loss mean: 157.28330993652344
nll mean: 148.84759521484375 	 kl mean: 8.750589370727539 	 loss mean: 157.59820556640625
nll mean: 148.5077667236328 	 kl mean: 8.750589370727539 	 loss mean: 157.25836181640625


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 147.97763061523438 	 kl mean: 8.750589370727539 	 loss mean: 156.72821044921875
nll mean: 148.49691772460938 	 kl mean: 8.750589370727539 	 loss mean: 157.2475128173828
nll mean: 148.35369873046875 	 kl mean: 8.750589370727539 	 loss mean: 157.1042938232422


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.46it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.55it/s][A

nll mean: 148.3016815185547 	 kl mean: 8.750589370727539 	 loss mean: 157.05227661132812
nll mean: 155.86351013183594 	 kl mean: 8.323749542236328 	 loss mean: 164.187255859375
nll mean: 155.6365509033203 	 kl mean: 8.323749542236328 	 loss mean: 163.96029663085938


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.55it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.46it/s][A

nll mean: 155.9458770751953 	 kl mean: 8.323749542236328 	 loss mean: 164.26962280273438
nll mean: 155.6334991455078 	 kl mean: 8.323749542236328 	 loss mean: 163.95724487304688
nll mean: 155.30992126464844 	 kl mean: 8.323749542236328 	 loss mean: 163.6336669921875


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.46it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A

nll mean: 155.91342163085938 	 kl mean: 8.323749542236328 	 loss mean: 164.2371826171875
nll mean: 155.5262451171875 	 kl mean: 8.323749542236328 	 loss mean: 163.85000610351562
nll mean: 155.91165161132812 	 kl mean: 8.323749542236328 	 loss mean: 164.2353973388672


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 154.87857055664062 	 kl mean: 8.323749542236328 	 loss mean: 163.2023162841797
nll mean: 155.41165161132812 	 kl mean: 8.323749542236328 	 loss mean: 163.7353973388672
nll mean: 118.57913208007812 	 kl mean: 8.873592376708984 	 loss mean: 127.45272827148438


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.28it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A

nll mean: 119.10442352294922 	 kl mean: 8.873592376708984 	 loss mean: 127.97801971435547
nll mean: 119.01081085205078 	 kl mean: 8.873592376708984 	 loss mean: 127.88441467285156
nll mean: 119.16731262207031 	 kl mean: 8.873592376708984 	 loss mean: 128.04090881347656


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.25it/s]

nll mean: 118.90275573730469 	 kl mean: 8.873592376708984 	 loss mean: 127.77635192871094
nll mean: 118.24246215820312 	 kl mean: 8.873592376708984 	 loss mean: 127.11605834960938
nll mean: 118.4613037109375 	 kl mean: 8.873592376708984 	 loss mean: 127.33489227294922


[A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.14it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
100%|██████████| 10/10 [00:00<00:00, 10.20it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.71858978271484 	 kl mean: 8.873592376708984 	 loss mean: 127.59217834472656
nll mean: 118.83412170410156 	 kl mean: 8.873592376708984 	 loss mean: 127.70771789550781
nll mean: 118.70150756835938 	 kl mean: 8.873592376708984 	 loss mean: 127.57510375976562


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.28it/s][A

nll mean: 106.06861877441406 	 kl mean: 7.537116050720215 	 loss mean: 113.6057357788086
nll mean: 105.90813446044922 	 kl mean: 7.537116050720215 	 loss mean: 113.44525146484375
nll mean: 106.41204833984375 	 kl mean: 7.537116050720215 	 loss mean: 113.94915771484375
nll mean: 106.9678955078125 	 kl mean: 7.537116050720215 	 loss mean: 114.50501251220703
nll mean: 106.17781829833984 	 kl mean: 7.537116050720215 	 loss mean: 113.71493530273438
nll mean: 106.49723815917969 	 kl mean: 7.537116050720215 	 loss mean: 114.03435516357422
nll mean: 106.48049926757812 	 kl mean: 7.537116050720215 	 loss mean: 114.01761627197266


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.28it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
100%|██████████| 10/10 [00:00<00:00, 32.61it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 106.28488159179688 	 kl mean: 7.537116050720215 	 loss mean: 113.8219985961914
nll mean: 106.24364471435547 	 kl mean: 7.537116050720215 	 loss mean: 113.78075408935547
nll mean: 106.37380981445312 	 kl mean: 7.537116050720215 	 loss mean: 113.91092681884766
nll mean: 158.15252685546875 	 kl mean: 8.180444717407227 	 loss mean: 166.3329620361328


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.50it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A

nll mean: 158.5224151611328 	 kl mean: 8.180444717407227 	 loss mean: 166.70286560058594
nll mean: 158.18572998046875 	 kl mean: 8.180444717407227 	 loss mean: 166.3661651611328
nll mean: 157.98031616210938 	 kl mean: 8.180444717407227 	 loss mean: 166.1607666015625


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.56it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A

nll mean: 158.428466796875 	 kl mean: 8.180444717407227 	 loss mean: 166.60891723632812
nll mean: 157.8385467529297 	 kl mean: 8.180444717407227 	 loss mean: 166.0189971923828
nll mean: 157.908447265625 	 kl mean: 8.180444717407227 	 loss mean: 166.08889770507812


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.61it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.59it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 157.98312377929688 	 kl mean: 8.180444717407227 	 loss mean: 166.16355895996094
nll mean: 158.0204620361328 	 kl mean: 8.180444717407227 	 loss mean: 166.20089721679688
nll mean: 158.7371826171875 	 kl mean: 8.180444717407227 	 loss mean: 166.91763305664062
nll mean: 120.31005859375 	 kl mean: 9.114471435546875 	 loss mean: 129.42453002929688


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.68it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.52it/s][A

nll mean: 120.7618179321289 	 kl mean: 9.114471435546875 	 loss mean: 129.87628173828125
nll mean: 121.57295989990234 	 kl mean: 9.114471435546875 	 loss mean: 130.68743896484375
nll mean: 121.07298278808594 	 kl mean: 9.114471435546875 	 loss mean: 130.1874542236328
nll mean: 121.21347045898438 	 kl mean: 9.114471435546875 	 loss mean: 130.32794189453125
nll mean: 121.2471923828125 	 kl mean: 9.114471435546875 	 loss mean: 130.36166381835938


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.52it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 21.35it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.39762878417969 	 kl mean: 9.114471435546875 	 loss mean: 130.51210021972656
nll mean: 121.59771728515625 	 kl mean: 9.114471435546875 	 loss mean: 130.71218872070312
nll mean: 122.00392150878906 	 kl mean: 9.114471435546875 	 loss mean: 131.11837768554688
nll mean: 120.72413635253906 	 kl mean: 9.114471435546875 	 loss mean: 129.83860778808594


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.72it/s][A

nll mean: 116.7447509765625 	 kl mean: 7.90917444229126 	 loss mean: 124.65391540527344
nll mean: 115.78414916992188 	 kl mean: 7.90917444229126 	 loss mean: 123.69332122802734
nll mean: 115.94461822509766 	 kl mean: 7.90917444229126 	 loss mean: 123.85379028320312


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.72it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.77it/s][A
                                               [A
                                              

nll mean: 116.18033599853516 	 kl mean: 7.90917444229126 	 loss mean: 124.08952331542969
nll mean: 116.07722473144531 	 kl mean: 7.90917444229126 	 loss mean: 123.98640441894531
nll mean: 115.87274932861328 	 kl mean: 7.90917444229126 	 loss mean: 123.78192901611328


 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.85it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.84it/s][A

nll mean: 116.2328872680664 	 kl mean: 7.90917444229126 	 loss mean: 124.14205932617188
nll mean: 116.12828826904297 	 kl mean: 7.90917444229126 	 loss mean: 124.03746032714844
nll mean: 116.21306610107422 	 kl mean: 7.90917444229126 	 loss mean: 124.12223815917969


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.82it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.84it/s][A

nll mean: 116.07157135009766 	 kl mean: 7.90917444229126 	 loss mean: 123.98074340820312
nll mean: 82.41139221191406 	 kl mean: 7.691121578216553 	 loss mean: 90.10250854492188
nll mean: 82.36071014404297 	 kl mean: 7.691121578216553 	 loss mean: 90.05183410644531
nll mean: 82.5587387084961 	 kl mean: 7.691121578216553 	 loss mean: 90.24986267089844
nll mean: 82.62504577636719 	 kl mean: 7.691121578216553 	 loss mean: 90.316162109375


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.84it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.78it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.88it/s][A

nll mean: 82.86029052734375 	 kl mean: 7.691121578216553 	 loss mean: 90.5514144897461
nll mean: 82.56755065917969 	 kl mean: 7.691121578216553 	 loss mean: 90.2586669921875
nll mean: 82.23600006103516 	 kl mean: 7.691121578216553 	 loss mean: 89.9271240234375
nll mean: 81.92228698730469 	 kl mean: 7.691121578216553 	 loss mean: 89.61341094970703
nll mean: 82.39598846435547 	 kl mean: 7.691121578216553 	 loss mean: 90.08711242675781


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 21.82it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 22.27it/s][A

nll mean: 82.43880462646484 	 kl mean: 7.691121578216553 	 loss mean: 90.12992858886719
nll mean: 108.52923583984375 	 kl mean: 7.603417873382568 	 loss mean: 116.13265228271484
nll mean: 108.4811782836914 	 kl mean: 7.603417873382568 	 loss mean: 116.0845947265625
nll mean: 108.28474426269531 	 kl mean: 7.603417873382568 	 loss mean: 115.88816833496094
nll mean: 108.66476440429688 	 kl mean: 7.603417873382568 	 loss mean: 116.26818084716797


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 22.27it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.06it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.77it/s][A

nll mean: 108.54305267333984 	 kl mean: 7.603417873382568 	 loss mean: 116.14646911621094
nll mean: 108.90625 	 kl mean: 7.603417873382568 	 loss mean: 116.50965881347656
nll mean: 108.8825454711914 	 kl mean: 7.603417873382568 	 loss mean: 116.4859619140625
nll mean: 108.90078735351562 	 kl mean: 7.603417873382568 	 loss mean: 116.50421142578125
nll mean: 108.99466705322266 	 kl mean: 7.603417873382568 	 loss mean: 116.59809112548828


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.53it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.46it/s][A

nll mean: 108.10456085205078 	 kl mean: 7.603417873382568 	 loss mean: 115.70797729492188
nll mean: 121.35223388671875 	 kl mean: 8.457212448120117 	 loss mean: 129.80943298339844
nll mean: 120.62701416015625 	 kl mean: 8.457212448120117 	 loss mean: 129.084228515625


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.46it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A

nll mean: 120.46208953857422 	 kl mean: 8.457212448120117 	 loss mean: 128.91929626464844
nll mean: 120.79020690917969 	 kl mean: 8.457212448120117 	 loss mean: 129.24742126464844
nll mean: 120.78482055664062 	 kl mean: 8.457212448120117 	 loss mean: 129.24203491210938


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.44it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A

nll mean: 120.25282287597656 	 kl mean: 8.457212448120117 	 loss mean: 128.7100372314453
nll mean: 120.96501159667969 	 kl mean: 8.457212448120117 	 loss mean: 129.42221069335938
nll mean: 120.52342224121094 	 kl mean: 8.457212448120117 	 loss mean: 128.9806365966797


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.97it/s][A

nll mean: 120.81611633300781 	 kl mean: 8.457212448120117 	 loss mean: 129.27333068847656
nll mean: 120.96893310546875 	 kl mean: 8.457212448120117 	 loss mean: 129.42613220214844
nll mean: 61.959110260009766 	 kl mean: 9.90134334564209 	 loss mean: 71.86045837402344


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 10%|█         | 1/10 [00:00<00:00,  9.97it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00,  9.99it/s]

nll mean: 62.01504898071289 	 kl mean: 9.90134334564209 	 loss mean: 71.91639709472656
nll mean: 62.43655014038086 	 kl mean: 9.90134334564209 	 loss mean: 72.337890625
nll mean: 62.465084075927734 	 kl mean: 9.90134334564209 	 loss mean: 72.36642456054688


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00,  9.99it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.00it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A

nll mean: 62.637420654296875 	 kl mean: 9.90134334564209 	 loss mean: 72.53876495361328
nll mean: 62.269676208496094 	 kl mean: 9.90134334564209 	 loss mean: 72.1710205078125


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.98it/s][A

nll mean: 62.67879867553711 	 kl mean: 9.90134334564209 	 loss mean: 72.58013916015625
nll mean: 62.566062927246094 	 kl mean: 9.90134334564209 	 loss mean: 72.4674072265625
nll mean: 62.52067565917969 	 kl mean: 9.90134334564209 	 loss mean: 72.42201232910156


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.98it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.06it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.88it/s][A

nll mean: 62.68451690673828 	 kl mean: 9.90134334564209 	 loss mean: 72.58586120605469
nll mean: 104.74037170410156 	 kl mean: 8.8842191696167 	 loss mean: 113.62460327148438
nll mean: 105.52989959716797 	 kl mean: 8.8842191696167 	 loss mean: 114.41412353515625


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 12.88it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 12.75it/s][A

nll mean: 105.976318359375 	 kl mean: 8.8842191696167 	 loss mean: 114.86054229736328
nll mean: 105.22676086425781 	 kl mean: 8.8842191696167 	 loss mean: 114.11097717285156
nll mean: 105.71351623535156 	 kl mean: 8.8842191696167 	 loss mean: 114.59774780273438


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 12.75it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.58it/s][A

nll mean: 105.4488525390625 	 kl mean: 8.8842191696167 	 loss mean: 114.33307647705078
nll mean: 105.56929779052734 	 kl mean: 8.8842191696167 	 loss mean: 114.45352172851562
nll mean: 105.73584747314453 	 kl mean: 8.8842191696167 	 loss mean: 114.62007141113281


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.32it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.58805847167969 	 kl mean: 8.8842191696167 	 loss mean: 114.47227478027344
nll mean: 105.43014526367188 	 kl mean: 8.8842191696167 	 loss mean: 114.31436920166016
nll mean: 138.6877899169922 	 kl mean: 9.011273384094238 	 loss mean: 147.69906616210938


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00, 10.00it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]

nll mean: 138.4357452392578 	 kl mean: 9.011273384094238 	 loss mean: 147.44700622558594
nll mean: 138.95455932617188 	 kl mean: 9.011273384094238 	 loss mean: 147.96585083007812
nll mean: 138.88650512695312 	 kl mean: 9.011273384094238 	 loss mean: 147.89776611328125



                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.00it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.93it/s][A

nll mean: 138.67257690429688 	 kl mean: 9.011273384094238 	 loss mean: 147.68386840820312
nll mean: 138.6710205078125 	 kl mean: 9.011273384094238 	 loss mean: 147.68228149414062


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.93it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.79it/s][A

nll mean: 138.52040100097656 	 kl mean: 9.011273384094238 	 loss mean: 147.53167724609375
nll mean: 138.37167358398438 	 kl mean: 9.011273384094238 	 loss mean: 147.3829345703125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 80%|████████  | 8/10 [00:01<00:00,  9.79it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.38134765625 	 kl mean: 9.011273384094238 	 loss mean: 147.39260864257812
nll mean: 138.37332153320312 	 kl mean: 9.011273384094238 	 loss mean: 147.38458251953125
nll mean: 63.248443603515625 	 kl mean: 8.507553100585938 	 loss mean: 71.75599670410156
nll mean: 63.779296875 	 kl mean: 8.507553100585938 	 loss mean: 72.28684997558594


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 30%|███       | 3/10 [00:00<00:00, 25.92it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A

nll mean: 62.986732482910156 	 kl mean: 8.507553100585938 	 loss mean: 71.49427795410156
nll mean: 63.15215301513672 	 kl mean: 8.507553100585938 	 loss mean: 71.65970611572266
nll mean: 62.937557220458984 	 kl mean: 8.507553100585938 	 loss mean: 71.44510650634766
nll mean: 62.495750427246094 	 kl mean: 8.507553100585938 	 loss mean: 71.00330352783203
nll mean: 63.460086822509766 	 kl mean: 8.507553100585938 	 loss mean: 71.96763610839844
nll mean: 63.09877014160156 	 kl mean: 8.507553100585938 	 loss mean: 71.6063232421875


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
100%|██████████| 10/10 [00:00<00:00, 25.40it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 21.54it/s][A

nll mean: 63.422523498535156 	 kl mean: 8.507553100585938 	 loss mean: 71.9300765991211
nll mean: 63.337486267089844 	 kl mean: 8.507553100585938 	 loss mean: 71.84503936767578
nll mean: 118.8221435546875 	 kl mean: 7.8592352867126465 	 loss mean: 126.6813735961914
nll mean: 119.04969787597656 	 kl mean: 7.8592352867126465 	 loss mean: 126.90892791748047
nll mean: 119.28470611572266 	 kl mean: 7.8592352867126465 	 loss mean: 127.14395141601562


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.54it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.40it/s][A

nll mean: 119.0274658203125 	 kl mean: 7.8592352867126465 	 loss mean: 126.8866958618164
nll mean: 119.03652954101562 	 kl mean: 7.8592352867126465 	 loss mean: 126.89576721191406
nll mean: 118.85801696777344 	 kl mean: 7.8592352867126465 	 loss mean: 126.71724700927734
nll mean: 119.14127349853516 	 kl mean: 7.8592352867126465 	 loss mean: 127.00050354003906
nll mean: 119.37617492675781 	 kl mean: 7.8592352867126465 	 loss mean: 127.23539733886719


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.40it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.31it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.69329071044922 	 kl mean: 7.8592352867126465 	 loss mean: 126.55252075195312
nll mean: 119.38629150390625 	 kl mean: 7.8592352867126465 	 loss mean: 127.24552917480469
nll mean: 119.94867706298828 	 kl mean: 8.9373197555542 	 loss mean: 128.88600158691406


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.41it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.41it/s][A

nll mean: 119.46343994140625 	 kl mean: 8.9373197555542 	 loss mean: 128.4007568359375
nll mean: 119.61406707763672 	 kl mean: 8.9373197555542 	 loss mean: 128.5513916015625
nll mean: 119.15935516357422 	 kl mean: 8.9373197555542 	 loss mean: 128.0966796875


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.41it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.44it/s][A

nll mean: 119.21328735351562 	 kl mean: 8.9373197555542 	 loss mean: 128.15060424804688
nll mean: 119.18447875976562 	 kl mean: 8.9373197555542 	 loss mean: 128.12179565429688
nll mean: 119.14170837402344 	 kl mean: 8.9373197555542 	 loss mean: 128.07904052734375


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.44it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.59it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.694580078125 	 kl mean: 8.9373197555542 	 loss mean: 128.63189697265625
nll mean: 119.685302734375 	 kl mean: 8.9373197555542 	 loss mean: 128.62261962890625
nll mean: 119.34813690185547 	 kl mean: 8.9373197555542 	 loss mean: 128.28546142578125


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 10.65it/s][A

nll mean: 113.63546752929688 	 kl mean: 8.122859954833984 	 loss mean: 121.7583236694336
nll mean: 113.81480407714844 	 kl mean: 8.122859954833984 	 loss mean: 121.93766021728516
nll mean: 113.5479507446289 	 kl mean: 8.122859954833984 	 loss mean: 121.67080688476562


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
 20%|██        | 2/10 [00:00<00:00, 10.65it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 10.63it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.64it/s][A

nll mean: 114.18846893310547 	 kl mean: 8.122859954833984 	 loss mean: 122.31132507324219
nll mean: 113.39492797851562 	 kl mean: 8.122859954833984 	 loss mean: 121.51779174804688
nll mean: 113.35441589355469 	 kl mean: 8.122859954833984 	 loss mean: 121.47727966308594


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.64it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.62it/s][A

nll mean: 114.301513671875 	 kl mean: 8.122859954833984 	 loss mean: 122.42437744140625
nll mean: 113.24547576904297 	 kl mean: 8.122859954833984 	 loss mean: 121.36833190917969
nll mean: 114.45834350585938 	 kl mean: 8.122859954833984 	 loss mean: 122.58120727539062


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.62it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.62it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 22.29it/s][A

nll mean: 113.93492889404297 	 kl mean: 8.122859954833984 	 loss mean: 122.05778503417969
nll mean: 112.88363647460938 	 kl mean: 8.287863731384277 	 loss mean: 121.17150115966797
nll mean: 112.12333679199219 	 kl mean: 8.287863731384277 	 loss mean: 120.41120910644531
nll mean: 112.8028564453125 	 kl mean: 8.287863731384277 	 loss mean: 121.0907211303711
nll mean: 112.22639465332031 	 kl mean: 8.287863731384277 	 loss mean: 120.5142593383789


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 22.29it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.50it/s][A

nll mean: 112.60842895507812 	 kl mean: 8.287863731384277 	 loss mean: 120.89630126953125
nll mean: 112.65603637695312 	 kl mean: 8.287863731384277 	 loss mean: 120.94389343261719
nll mean: 112.3192138671875 	 kl mean: 8.287863731384277 	 loss mean: 120.60708618164062
nll mean: 111.86892700195312 	 kl mean: 8.287863731384277 	 loss mean: 120.15679931640625
nll mean: 112.21585083007812 	 kl mean: 8.287863731384277 	 loss mean: 120.50371551513672


                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.32it/s]
100%|██████████| 10/10 [00:00<00:00, 21.52it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]


nll mean: 112.38578033447266 	 kl mean: 8.287863731384277 	 loss mean: 120.67365264892578
nll mean: 87.47872161865234 	 kl mean: 9.584465026855469 	 loss mean: 97.06318664550781
nll mean: 86.98787689208984 	 kl mean: 9.584465026855469 	 loss mean: 96.57234954833984
nll mean: 86.5304183959961 	 kl mean: 9.584465026855469 	 loss mean: 96.1148910522461
nll mean: 86.46359252929688 	 kl mean: 9.584465026855469 	 loss mean: 96.04805755615234
nll mean: 86.9430160522461 	 kl mean: 9.584465026855469 	 loss mean: 96.52748107910156
nll mean: 87.17574310302734 	 kl mean: 9.584465026855469 	 loss mean: 96.76021575927734


                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.81it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
100%|██████████| 10/10 [00:00<00:00, 30.41it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 86.864501953125 	 kl mean: 9.584465026855469 	 loss mean: 96.448974609375
nll mean: 87.01495361328125 	 kl mean: 9.584465026855469 	 loss mean: 96.59941864013672
nll mean: 86.59957885742188 	 kl mean: 9.584465026855469 	 loss mean: 96.18404388427734
nll mean: 86.96469116210938 	 kl mean: 9.584465026855469 	 loss mean: 96.54915618896484
Approximate NLL:
tensor(121.8104, device='cuda:0')
Approximate KL:
tensor(8.4971, device='cuda:0')
Testing took 0:00:25.407683


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .10it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .10it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 26.10it/s][A

nll mean: 109.2979965209961 	 kl mean: 9.496255874633789 	 loss mean: 118.79425048828125
nll mean: 108.57308959960938 	 kl mean: 9.496255874633789 	 loss mean: 118.06935119628906
nll mean: 109.4521484375 	 kl mean: 9.496255874633789 	 loss mean: 118.94841003417969
nll mean: 108.85159301757812 	 kl mean: 9.496255874633789 	 loss mean: 118.34783935546875
nll mean: 108.64936828613281 	 kl mean: 9.496255874633789 	 loss mean: 118.1456298828125


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 26.10it/s][A
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .65it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                      .36it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 25.05it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.64007568359375 	 kl mean: 9.496255874633789 	 loss mean: 119.1363296508789
nll mean: 108.88551330566406 	 kl mean: 9.496255874633789 	 loss mean: 118.38177490234375
nll mean: 109.0101318359375 	 kl mean: 9.496255874633789 	 loss mean: 118.50637817382812
nll mean: 109.38240814208984 	 kl mean: 9.496255874633789 	 loss mean: 118.87866973876953
nll mean: 109.06995391845703 	 kl mean: 9.496255874633789 	 loss mean: 118.56620788574219


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 20%|██        | 2/10 [00:00<00:00, 13.75it/s][A

nll mean: 125.71388244628906 	 kl mean: 8.842206954956055 	 loss mean: 134.55609130859375
nll mean: 126.01420593261719 	 kl mean: 8.842206954956055 	 loss mean: 134.85641479492188
nll mean: 126.29507446289062 	 kl mean: 8.842206954956055 	 loss mean: 135.1372833251953


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 20%|██        | 2/10 [00:00<00:00, 13.75it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 40%|████      | 4/10 [00:00<00:00, 13.91it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.90it/s][A

nll mean: 126.16473388671875 	 kl mean: 8.842206954956055 	 loss mean: 135.00694274902344
nll mean: 125.95578002929688 	 kl mean: 8.842206954956055 	 loss mean: 134.79798889160156
nll mean: 125.77003479003906 	 kl mean: 8.842206954956055 	 loss mean: 134.61224365234375


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.90it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.93it/s][A

nll mean: 125.8786392211914 	 kl mean: 8.842206954956055 	 loss mean: 134.72085571289062
nll mean: 125.72819519042969 	 kl mean: 8.842206954956055 	 loss mean: 134.57040405273438
nll mean: 125.801513671875 	 kl mean: 8.842206954956055 	 loss mean: 134.6437225341797


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.93it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.01it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 25.13it/s][A

nll mean: 125.87371826171875 	 kl mean: 8.842206954956055 	 loss mean: 134.71592712402344
nll mean: 99.56550598144531 	 kl mean: 8.339632034301758 	 loss mean: 107.90513610839844
nll mean: 99.44546508789062 	 kl mean: 8.339632034301758 	 loss mean: 107.78509521484375
nll mean: 98.55819702148438 	 kl mean: 8.339632034301758 	 loss mean: 106.8978271484375
nll mean: 98.91456604003906 	 kl mean: 8.339632034301758 	 loss mean: 107.25420379638672


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 30%|███       | 3/10 [00:00<00:00, 25.13it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.52it/s][A

nll mean: 100.09017944335938 	 kl mean: 8.339632034301758 	 loss mean: 108.4298095703125
nll mean: 99.44863891601562 	 kl mean: 8.339632034301758 	 loss mean: 107.78827667236328
nll mean: 99.38087463378906 	 kl mean: 8.339632034301758 	 loss mean: 107.72049713134766
nll mean: 99.3169174194336 	 kl mean: 8.339632034301758 	 loss mean: 107.65655517578125
nll mean: 98.93539428710938 	 kl mean: 8.339632034301758 	 loss mean: 107.27503967285156


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.02it/s]
100%|██████████| 10/10 [00:00<00:00, 24.12it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.86it/s][A

nll mean: 99.52694702148438 	 kl mean: 8.339632034301758 	 loss mean: 107.86658477783203
nll mean: 138.0225372314453 	 kl mean: 8.971473693847656 	 loss mean: 146.99400329589844
nll mean: 137.75381469726562 	 kl mean: 8.971473693847656 	 loss mean: 146.72528076171875


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.86it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.88it/s][A

nll mean: 138.39306640625 	 kl mean: 8.971473693847656 	 loss mean: 147.36453247070312
nll mean: 137.93447875976562 	 kl mean: 8.971473693847656 	 loss mean: 146.90594482421875
nll mean: 137.84906005859375 	 kl mean: 8.971473693847656 	 loss mean: 146.82052612304688


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 40%|████      | 4/10 [00:00<00:00, 10.88it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.90it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.89it/s][A

nll mean: 137.9807891845703 	 kl mean: 8.971473693847656 	 loss mean: 146.9522705078125
nll mean: 137.5442657470703 	 kl mean: 8.971473693847656 	 loss mean: 146.51573181152344
nll mean: 137.34136962890625 	 kl mean: 8.971473693847656 	 loss mean: 146.31283569335938


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.85it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.02529907226562 	 kl mean: 8.971473693847656 	 loss mean: 146.99676513671875
nll mean: 138.00469970703125 	 kl mean: 8.971473693847656 	 loss mean: 146.97618103027344
nll mean: 126.76334381103516 	 kl mean: 8.348369598388672 	 loss mean: 135.11170959472656


                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 13.61it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.59it/s][A

nll mean: 126.76251983642578 	 kl mean: 8.348369598388672 	 loss mean: 135.1108856201172
nll mean: 126.91362762451172 	 kl mean: 8.348369598388672 	 loss mean: 135.26199340820312
nll mean: 126.65601348876953 	 kl mean: 8.348369598388672 	 loss mean: 135.00437927246094


                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 13.59it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.80it/s][A

nll mean: 126.66709899902344 	 kl mean: 8.348369598388672 	 loss mean: 135.01547241210938
nll mean: 126.58465576171875 	 kl mean: 8.348369598388672 	 loss mean: 134.9330291748047
nll mean: 126.75167083740234 	 kl mean: 8.348369598388672 	 loss mean: 135.10003662109375


                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.80it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.94it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.98it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.74673461914062 	 kl mean: 8.348369598388672 	 loss mean: 135.09510803222656
nll mean: 125.88323974609375 	 kl mean: 8.348369598388672 	 loss mean: 134.2316131591797
nll mean: 126.26432800292969 	 kl mean: 8.348369598388672 	 loss mean: 134.61270141601562


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 13.94it/s][A

nll mean: 122.87944030761719 	 kl mean: 8.242907524108887 	 loss mean: 131.12234497070312
nll mean: 123.24667358398438 	 kl mean: 8.242907524108887 	 loss mean: 131.48959350585938
nll mean: 123.11865997314453 	 kl mean: 8.242907524108887 	 loss mean: 131.36155700683594


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 13.94it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 14.04it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.16it/s][A

nll mean: 122.94143676757812 	 kl mean: 8.242907524108887 	 loss mean: 131.18435668945312
nll mean: 122.81062316894531 	 kl mean: 8.242907524108887 	 loss mean: 131.05352783203125
nll mean: 123.50202941894531 	 kl mean: 8.242907524108887 	 loss mean: 131.74493408203125


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.16it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.13it/s][A

nll mean: 122.87480926513672 	 kl mean: 8.242907524108887 	 loss mean: 131.11773681640625
nll mean: 123.26976013183594 	 kl mean: 8.242907524108887 	 loss mean: 131.51268005371094
nll mean: 122.79978942871094 	 kl mean: 8.242907524108887 	 loss mean: 131.04269409179688


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.08it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.11it/s][A

nll mean: 122.71611022949219 	 kl mean: 8.242907524108887 	 loss mean: 130.95901489257812
nll mean: 133.74661254882812 	 kl mean: 8.362850189208984 	 loss mean: 142.10946655273438
nll mean: 133.59873962402344 	 kl mean: 8.362850189208984 	 loss mean: 141.9615936279297
nll mean: 133.90518188476562 	 kl mean: 8.362850189208984 	 loss mean: 142.26803588867188
nll mean: 134.1688690185547 	 kl mean: 8.362850189208984 	 loss mean: 142.53172302246094


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.11it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.99it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.77it/s][A

nll mean: 134.31515502929688 	 kl mean: 8.362850189208984 	 loss mean: 142.67800903320312
nll mean: 134.21124267578125 	 kl mean: 8.362850189208984 	 loss mean: 142.5740966796875
nll mean: 134.12417602539062 	 kl mean: 8.362850189208984 	 loss mean: 142.48703002929688
nll mean: 134.1800994873047 	 kl mean: 8.362850189208984 	 loss mean: 142.54295349121094
nll mean: 133.39028930664062 	 kl mean: 8.362850189208984 	 loss mean: 141.7531280517578


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 24.63it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.90it/s][A

nll mean: 133.8779754638672 	 kl mean: 8.362850189208984 	 loss mean: 142.24081420898438
nll mean: 105.80086517333984 	 kl mean: 8.345904350280762 	 loss mean: 114.14677429199219
nll mean: 105.55067443847656 	 kl mean: 8.345904350280762 	 loss mean: 113.8965835571289
nll mean: 105.61563110351562 	 kl mean: 8.345904350280762 	 loss mean: 113.96153259277344
nll mean: 106.0063705444336 	 kl mean: 8.345904350280762 	 loss mean: 114.3522720336914


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.90it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.92it/s][A
                                              [A

nll mean: 105.47052001953125 	 kl mean: 8.345904350280762 	 loss mean: 113.8164291381836
nll mean: 106.23692321777344 	 kl mean: 8.345904350280762 	 loss mean: 114.58282470703125
nll mean: 105.70361328125 	 kl mean: 8.345904350280762 	 loss mean: 114.04952239990234
nll mean: 105.70167541503906 	 kl mean: 8.345904350280762 	 loss mean: 114.04757690429688
nll mean: 106.0916976928711 	 kl mean: 8.345904350280762 	 loss mean: 114.43760681152344



 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
100%|██████████| 10/10 [00:00<00:00, 24.86it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.00it/s][A

nll mean: 105.71598815917969 	 kl mean: 8.345904350280762 	 loss mean: 114.06189727783203
nll mean: 130.94143676757812 	 kl mean: 9.30420970916748 	 loss mean: 140.24563598632812
nll mean: 131.5760498046875 	 kl mean: 9.30420970916748 	 loss mean: 140.88027954101562


                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.00it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 40%|████      | 4/10 [00:00<00:00, 14.36it/s]

nll mean: 131.8358154296875 	 kl mean: 9.30420970916748 	 loss mean: 141.1400146484375
nll mean: 131.67959594726562 	 kl mean: 9.30420970916748 	 loss mean: 140.98379516601562
nll mean: 131.7520751953125 	 kl mean: 9.30420970916748 	 loss mean: 141.05628967285156
nll mean: 131.36016845703125 	 kl mean: 9.30420970916748 	 loss mean: 140.6643829345703


[A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.34it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A

nll mean: 132.2386474609375 	 kl mean: 9.30420970916748 	 loss mean: 141.54287719726562
nll mean: 132.11953735351562 	 kl mean: 9.30420970916748 	 loss mean: 141.42373657226562
nll mean: 131.34600830078125 	 kl mean: 9.30420970916748 	 loss mean: 140.6502227783203


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.68it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.48it/s][A

nll mean: 131.9410400390625 	 kl mean: 9.30420970916748 	 loss mean: 141.2452392578125
nll mean: 129.1566925048828 	 kl mean: 8.988276481628418 	 loss mean: 138.1449737548828
nll mean: 129.60983276367188 	 kl mean: 8.988276481628418 	 loss mean: 138.59811401367188
nll mean: 129.00759887695312 	 kl mean: 8.988276481628418 	 loss mean: 137.99588012695312
nll mean: 129.8663787841797 	 kl mean: 8.988276481628418 	 loss mean: 138.85464477539062


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.48it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.37it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.35it/s][A

nll mean: 130.03968811035156 	 kl mean: 8.988276481628418 	 loss mean: 139.02796936035156
nll mean: 129.42076110839844 	 kl mean: 8.988276481628418 	 loss mean: 138.40902709960938
nll mean: 129.93743896484375 	 kl mean: 8.988276481628418 	 loss mean: 138.92572021484375
nll mean: 129.7987060546875 	 kl mean: 8.988276481628418 	 loss mean: 138.7869873046875
nll mean: 129.6175537109375 	 kl mean: 8.988276481628418 	 loss mean: 138.6058349609375


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.30it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.98it/s][A

nll mean: 128.92068481445312 	 kl mean: 8.988276481628418 	 loss mean: 137.90895080566406
nll mean: 118.53816223144531 	 kl mean: 9.2249116897583 	 loss mean: 127.76307678222656
nll mean: 118.19429016113281 	 kl mean: 9.2249116897583 	 loss mean: 127.41920471191406
nll mean: 119.09522247314453 	 kl mean: 9.2249116897583 	 loss mean: 128.32012939453125
nll mean: 118.59200286865234 	 kl mean: 9.2249116897583 	 loss mean: 127.8169174194336


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.98it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.96it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.88it/s][A

nll mean: 118.16336822509766 	 kl mean: 9.2249116897583 	 loss mean: 127.3882827758789
nll mean: 118.34969329833984 	 kl mean: 9.2249116897583 	 loss mean: 127.5746078491211
nll mean: 117.9564208984375 	 kl mean: 9.2249116897583 	 loss mean: 127.18132781982422
nll mean: 118.257568359375 	 kl mean: 9.2249116897583 	 loss mean: 127.48249816894531
nll mean: 118.64949035644531 	 kl mean: 9.2249116897583 	 loss mean: 127.8743896484375


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s]
100%|██████████| 10/10 [00:00<00:00, 24.78it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.71it/s][A

nll mean: 118.56352996826172 	 kl mean: 9.2249116897583 	 loss mean: 127.78844451904297
nll mean: 141.35223388671875 	 kl mean: 9.030508041381836 	 loss mean: 150.38275146484375
nll mean: 141.21749877929688 	 kl mean: 9.030508041381836 	 loss mean: 150.24801635742188
nll mean: 140.2584686279297 	 kl mean: 9.030508041381836 	 loss mean: 149.28897094726562
nll mean: 140.80455017089844 	 kl mean: 9.030508041381836 	 loss mean: 149.83505249023438


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 21.71it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.53it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.46it/s][A

nll mean: 141.2103729248047 	 kl mean: 9.030508041381836 	 loss mean: 150.24087524414062
nll mean: 140.89369201660156 	 kl mean: 9.030508041381836 	 loss mean: 149.92420959472656
nll mean: 140.81996154785156 	 kl mean: 9.030508041381836 	 loss mean: 149.8504638671875
nll mean: 140.92164611816406 	 kl mean: 9.030508041381836 	 loss mean: 149.9521484375
nll mean: 140.57247924804688 	 kl mean: 9.030508041381836 	 loss mean: 149.6029815673828


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.99it/s]
100%|██████████| 10/10 [00:00<00:00, 21.32it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.42it/s][A

nll mean: 141.07962036132812 	 kl mean: 9.030508041381836 	 loss mean: 150.110107421875
nll mean: 119.97650146484375 	 kl mean: 9.246963500976562 	 loss mean: 129.2234649658203
nll mean: 119.70523071289062 	 kl mean: 9.246963500976562 	 loss mean: 128.9521942138672


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.42it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A

nll mean: 120.44776916503906 	 kl mean: 9.246963500976562 	 loss mean: 129.69473266601562
nll mean: 119.68614196777344 	 kl mean: 9.246963500976562 	 loss mean: 128.93310546875
nll mean: 119.9529800415039 	 kl mean: 9.246963500976562 	 loss mean: 129.199951171875


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 119.90866088867188 	 kl mean: 9.246963500976562 	 loss mean: 129.1556396484375
nll mean: 120.00702667236328 	 kl mean: 9.246963500976562 	 loss mean: 129.25399780273438
nll mean: 120.11553955078125 	 kl mean: 9.246963500976562 	 loss mean: 129.3625030517578


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.99it/s][A

nll mean: 119.78024291992188 	 kl mean: 9.246963500976562 	 loss mean: 129.02720642089844
nll mean: 119.54951477050781 	 kl mean: 9.246963500976562 	 loss mean: 128.79647827148438
nll mean: 161.32937622070312 	 kl mean: 9.221147537231445 	 loss mean: 170.55050659179688


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 10%|█         | 1/10 [00:00<00:00,  9.99it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00,  9.90it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.85it/s][A

nll mean: 160.79684448242188 	 kl mean: 9.221147537231445 	 loss mean: 170.0179901123047
nll mean: 160.17337036132812 	 kl mean: 9.221147537231445 	 loss mean: 169.39451599121094


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00,  9.85it/s][A
                                               [A
[A                                           

nll mean: 160.3596954345703 	 kl mean: 9.221147537231445 	 loss mean: 169.58084106445312
nll mean: 160.96453857421875 	 kl mean: 9.221147537231445 	 loss mean: 170.18569946289062


 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.92it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.90it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.87it/s][A

nll mean: 160.2887725830078 	 kl mean: 9.221147537231445 	 loss mean: 169.50991821289062
nll mean: 160.79110717773438 	 kl mean: 9.221147537231445 	 loss mean: 170.01226806640625
nll mean: 160.47293090820312 	 kl mean: 9.221147537231445 	 loss mean: 169.69407653808594


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.87it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.89it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.88it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 160.97254943847656 	 kl mean: 9.221147537231445 	 loss mean: 170.19369506835938
nll mean: 160.78428649902344 	 kl mean: 9.221147537231445 	 loss mean: 170.00543212890625
nll mean: 135.12417602539062 	 kl mean: 8.340372085571289 	 loss mean: 143.46453857421875


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.31it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.05it/s][A

nll mean: 134.84979248046875 	 kl mean: 8.340372085571289 	 loss mean: 143.19015502929688
nll mean: 135.0140380859375 	 kl mean: 8.340372085571289 	 loss mean: 143.35440063476562
nll mean: 134.66616821289062 	 kl mean: 8.340372085571289 	 loss mean: 143.00653076171875
nll mean: 135.0622100830078 	 kl mean: 8.340372085571289 	 loss mean: 143.402587890625


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 18.05it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.03it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.01it/s][A

nll mean: 134.66607666015625 	 kl mean: 8.340372085571289 	 loss mean: 143.00643920898438
nll mean: 134.73146057128906 	 kl mean: 8.340372085571289 	 loss mean: 143.07183837890625
nll mean: 135.08779907226562 	 kl mean: 8.340372085571289 	 loss mean: 143.42816162109375
nll mean: 134.7519073486328 	 kl mean: 8.340372085571289 	 loss mean: 143.09226989746094


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.01it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.93it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.43it/s][A

nll mean: 135.41769409179688 	 kl mean: 8.340372085571289 	 loss mean: 143.75807189941406
nll mean: 142.656005859375 	 kl mean: 8.882591247558594 	 loss mean: 151.53858947753906
nll mean: 143.3074951171875 	 kl mean: 8.882591247558594 	 loss mean: 152.19009399414062


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.43it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.54it/s][A

nll mean: 142.606689453125 	 kl mean: 8.882591247558594 	 loss mean: 151.4892578125
nll mean: 142.78240966796875 	 kl mean: 8.882591247558594 	 loss mean: 151.6649932861328
nll mean: 143.30859375 	 kl mean: 8.882591247558594 	 loss mean: 152.19119262695312


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.54it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.63it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.64it/s][A

nll mean: 143.19424438476562 	 kl mean: 8.882591247558594 	 loss mean: 152.07684326171875
nll mean: 143.2314910888672 	 kl mean: 8.882591247558594 	 loss mean: 152.11407470703125
nll mean: 142.79437255859375 	 kl mean: 8.882591247558594 	 loss mean: 151.67697143554688


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.64it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.06881713867188 	 kl mean: 8.882591247558594 	 loss mean: 151.951416015625
nll mean: 142.78302001953125 	 kl mean: 8.882591247558594 	 loss mean: 151.66558837890625
nll mean: 144.78900146484375 	 kl mean: 7.767889976501465 	 loss mean: 152.556884765625
nll mean: 144.9837646484375 	 kl mean: 7.767889976501465 	 loss mean: 152.75164794921875


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.48it/s][A

nll mean: 144.84866333007812 	 kl mean: 7.767889976501465 	 loss mean: 152.61656188964844
nll mean: 144.66009521484375 	 kl mean: 7.767889976501465 	 loss mean: 152.427978515625
nll mean: 144.81370544433594 	 kl mean: 7.767889976501465 	 loss mean: 152.5815887451172
nll mean: 144.68450927734375 	 kl mean: 7.767889976501465 	 loss mean: 152.452392578125
nll mean: 145.04615783691406 	 kl mean: 7.767889976501465 	 loss mean: 152.8140411376953


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.48it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 24.32it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.95806884765625 	 kl mean: 7.767889976501465 	 loss mean: 152.7259521484375
nll mean: 144.60806274414062 	 kl mean: 7.767889976501465 	 loss mean: 152.37594604492188
nll mean: 144.80030822753906 	 kl mean: 7.767889976501465 	 loss mean: 152.5681915283203
nll mean: 133.72506713867188 	 kl mean: 8.83085823059082 	 loss mean: 142.555908203125
nll mean: 133.86016845703125 	 kl mean: 8.83085823059082 	 loss mean: 142.6910400390625


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A

nll mean: 133.56192016601562 	 kl mean: 8.83085823059082 	 loss mean: 142.3927764892578
nll mean: 133.690185546875 	 kl mean: 8.83085823059082 	 loss mean: 142.5210418701172
nll mean: 133.47341918945312 	 kl mean: 8.83085823059082 	 loss mean: 142.30429077148438
nll mean: 133.7246551513672 	 kl mean: 8.83085823059082 	 loss mean: 142.55551147460938
nll mean: 133.89169311523438 	 kl mean: 8.83085823059082 	 loss mean: 142.72254943847656


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.77it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
100%|██████████| 10/10 [00:00<00:00, 24.71it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.71546936035156 	 kl mean: 8.83085823059082 	 loss mean: 142.54632568359375
nll mean: 133.36764526367188 	 kl mean: 8.83085823059082 	 loss mean: 142.198486328125
nll mean: 133.46231079101562 	 kl mean: 8.83085823059082 	 loss mean: 142.2931671142578
nll mean: 128.39697265625 	 kl mean: 9.476274490356445 	 loss mean: 137.8732452392578


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.30it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.30it/s][A

nll mean: 129.13031005859375 	 kl mean: 9.476274490356445 	 loss mean: 138.6065673828125
nll mean: 128.819091796875 	 kl mean: 9.476274490356445 	 loss mean: 138.2953643798828
nll mean: 128.96728515625 	 kl mean: 9.476274490356445 	 loss mean: 138.44357299804688


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 40%|████      | 4/10 [00:00<00:00, 12.30it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A

nll mean: 128.49119567871094 	 kl mean: 9.476274490356445 	 loss mean: 137.96746826171875
nll mean: 129.021240234375 	 kl mean: 9.476274490356445 	 loss mean: 138.4975128173828
nll mean: 128.33816528320312 	 kl mean: 9.476274490356445 	 loss mean: 137.814453125


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.62it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 129.12066650390625 	 kl mean: 9.476274490356445 	 loss mean: 138.596923828125
nll mean: 129.4293975830078 	 kl mean: 9.476274490356445 	 loss mean: 138.90567016601562
nll mean: 128.94549560546875 	 kl mean: 9.476274490356445 	 loss mean: 138.42178344726562


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 12.78it/s][A

nll mean: 149.1558380126953 	 kl mean: 9.006087303161621 	 loss mean: 158.16192626953125
nll mean: 149.50994873046875 	 kl mean: 9.006087303161621 	 loss mean: 158.51605224609375
nll mean: 149.216064453125 	 kl mean: 9.006087303161621 	 loss mean: 158.22216796875


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 12.78it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 12.68it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A

nll mean: 149.8382568359375 	 kl mean: 9.006087303161621 	 loss mean: 158.84434509277344
nll mean: 149.13552856445312 	 kl mean: 9.006087303161621 	 loss mean: 158.1416015625
nll mean: 149.43185424804688 	 kl mean: 9.006087303161621 	 loss mean: 158.43792724609375


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.51it/s][A

nll mean: 149.43585205078125 	 kl mean: 9.006087303161621 	 loss mean: 158.4419403076172
nll mean: 149.44012451171875 	 kl mean: 9.006087303161621 	 loss mean: 158.4462127685547
nll mean: 149.38009643554688 	 kl mean: 9.006087303161621 	 loss mean: 158.38619995117188


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.51it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.47it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.58it/s][A

nll mean: 149.09698486328125 	 kl mean: 9.006087303161621 	 loss mean: 158.1030731201172
nll mean: 156.7175750732422 	 kl mean: 8.584087371826172 	 loss mean: 165.30166625976562
nll mean: 156.18905639648438 	 kl mean: 8.584087371826172 	 loss mean: 164.77313232421875


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.58it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.71it/s][A

nll mean: 156.6441192626953 	 kl mean: 8.584087371826172 	 loss mean: 165.22821044921875
nll mean: 156.61572265625 	 kl mean: 8.584087371826172 	 loss mean: 165.19981384277344
nll mean: 155.90016174316406 	 kl mean: 8.584087371826172 	 loss mean: 164.4842529296875


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 40%|████      | 4/10 [00:00<00:00, 12.71it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.71it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.65it/s][A

nll mean: 156.64866638183594 	 kl mean: 8.584087371826172 	 loss mean: 165.23275756835938
nll mean: 156.6305694580078 	 kl mean: 8.584087371826172 	 loss mean: 165.2146453857422
nll mean: 156.7568359375 	 kl mean: 8.584087371826172 	 loss mean: 165.3409423828125


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.65it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 157.0956573486328 	 kl mean: 8.584087371826172 	 loss mean: 165.67974853515625
nll mean: 157.29771423339844 	 kl mean: 8.584087371826172 	 loss mean: 165.88180541992188
nll mean: 117.23689270019531 	 kl mean: 8.98953628540039 	 loss mean: 126.22643280029297


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.32it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A

nll mean: 117.20877838134766 	 kl mean: 8.98953628540039 	 loss mean: 126.19832611083984
nll mean: 117.86503601074219 	 kl mean: 8.98953628540039 	 loss mean: 126.85456848144531
nll mean: 117.29732513427734 	 kl mean: 8.98953628540039 	 loss mean: 126.28684997558594


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 10.28it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.29it/s][A

nll mean: 117.05194854736328 	 kl mean: 8.98953628540039 	 loss mean: 126.0414810180664
nll mean: 117.87541198730469 	 kl mean: 8.98953628540039 	 loss mean: 126.86494445800781
nll mean: 117.44114685058594 	 kl mean: 8.98953628540039 	 loss mean: 126.43067932128906


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.29it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.27it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.27it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.59074401855469 	 kl mean: 8.98953628540039 	 loss mean: 126.58028411865234
nll mean: 117.59268951416016 	 kl mean: 8.98953628540039 	 loss mean: 126.58222198486328
nll mean: 117.7298355102539 	 kl mean: 8.98953628540039 	 loss mean: 126.71937561035156


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.76it/s][A

nll mean: 106.39957427978516 	 kl mean: 7.661587715148926 	 loss mean: 114.0611572265625
nll mean: 106.65582275390625 	 kl mean: 7.661587715148926 	 loss mean: 114.31741333007812
nll mean: 106.338623046875 	 kl mean: 7.661587715148926 	 loss mean: 114.00021362304688
nll mean: 106.00556945800781 	 kl mean: 7.661587715148926 	 loss mean: 113.66715240478516
nll mean: 106.01493835449219 	 kl mean: 7.661587715148926 	 loss mean: 113.67652893066406
nll mean: 105.95958709716797 	 kl mean: 7.661587715148926 	 loss mean: 113.62118530273438
nll mean: 106.13046264648438 	 kl mean: 7.661587715148926 	 loss mean: 113.79204559326172


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.76it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 32.95it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               


nll mean: 106.46005249023438 	 kl mean: 7.661587715148926 	 loss mean: 114.12162780761719
nll mean: 105.86808013916016 	 kl mean: 7.661587715148926 	 loss mean: 113.5296630859375
nll mean: 106.87489318847656 	 kl mean: 7.661587715148926 	 loss mean: 114.5364761352539
nll mean: 159.4384765625 	 kl mean: 8.410591125488281 	 loss mean: 167.84906005859375


 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 14.66it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.65it/s][A

nll mean: 159.70413208007812 	 kl mean: 8.410591125488281 	 loss mean: 168.11474609375
nll mean: 159.107421875 	 kl mean: 8.410591125488281 	 loss mean: 167.5180206298828
nll mean: 159.6287841796875 	 kl mean: 8.410591125488281 	 loss mean: 168.03936767578125


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 40%|████      | 4/10 [00:00<00:00, 14.65it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.64it/s][A

nll mean: 159.333251953125 	 kl mean: 8.410591125488281 	 loss mean: 167.74383544921875
nll mean: 159.71792602539062 	 kl mean: 8.410591125488281 	 loss mean: 168.12852478027344
nll mean: 159.1493377685547 	 kl mean: 8.410591125488281 	 loss mean: 167.5599365234375


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.64it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.67it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 159.526123046875 	 kl mean: 8.410591125488281 	 loss mean: 167.93670654296875
nll mean: 159.57186889648438 	 kl mean: 8.410591125488281 	 loss mean: 167.98245239257812
nll mean: 159.24607849121094 	 kl mean: 8.410591125488281 	 loss mean: 167.65667724609375
nll mean: 120.21087646484375 	 kl mean: 9.603468894958496 	 loss mean: 129.8143310546875


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.80it/s][A

nll mean: 120.01866912841797 	 kl mean: 9.603468894958496 	 loss mean: 129.6221466064453
nll mean: 120.45690155029297 	 kl mean: 9.603468894958496 	 loss mean: 130.06036376953125
nll mean: 121.04808807373047 	 kl mean: 9.603468894958496 	 loss mean: 130.65155029296875
nll mean: 120.51199340820312 	 kl mean: 9.603468894958496 	 loss mean: 130.11544799804688
nll mean: 120.09284973144531 	 kl mean: 9.603468894958496 	 loss mean: 129.69631958007812


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.80it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.36it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.375732421875 	 kl mean: 9.603468894958496 	 loss mean: 129.97921752929688
nll mean: 120.54586029052734 	 kl mean: 9.603468894958496 	 loss mean: 130.14932250976562
nll mean: 120.60905456542969 	 kl mean: 9.603468894958496 	 loss mean: 130.2125244140625
nll mean: 120.48909759521484 	 kl mean: 9.603468894958496 	 loss mean: 130.09255981445312


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.68it/s][A

nll mean: 113.99627685546875 	 kl mean: 8.427966117858887 	 loss mean: 122.42425537109375
nll mean: 113.95446014404297 	 kl mean: 8.427966117858887 	 loss mean: 122.38241577148438
nll mean: 114.40303802490234 	 kl mean: 8.427966117858887 	 loss mean: 122.83100891113281


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.68it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.76it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A

nll mean: 114.2369384765625 	 kl mean: 8.427966117858887 	 loss mean: 122.66490173339844
nll mean: 113.91110229492188 	 kl mean: 8.427966117858887 	 loss mean: 122.33905792236328
nll mean: 113.37543487548828 	 kl mean: 8.427966117858887 	 loss mean: 121.80340576171875


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.76it/s][A

nll mean: 114.14108276367188 	 kl mean: 8.427966117858887 	 loss mean: 122.56904602050781
nll mean: 113.47877502441406 	 kl mean: 8.427966117858887 	 loss mean: 121.90674591064453
nll mean: 113.83824157714844 	 kl mean: 8.427966117858887 	 loss mean: 122.26620483398438


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.78it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 23.03it/s][A

nll mean: 113.94061279296875 	 kl mean: 8.427966117858887 	 loss mean: 122.36857604980469
nll mean: 82.7533187866211 	 kl mean: 7.687598705291748 	 loss mean: 90.44091033935547
nll mean: 82.14282989501953 	 kl mean: 7.687598705291748 	 loss mean: 89.83042907714844
nll mean: 82.63581848144531 	 kl mean: 7.687598705291748 	 loss mean: 90.32342529296875
nll mean: 82.69956970214844 	 kl mean: 7.687598705291748 	 loss mean: 90.38717651367188


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00, 23.03it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.62it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.94it/s][A

nll mean: 82.61527252197266 	 kl mean: 7.687598705291748 	 loss mean: 90.30287170410156
nll mean: 82.18357849121094 	 kl mean: 7.687598705291748 	 loss mean: 89.87118530273438
nll mean: 82.17113494873047 	 kl mean: 7.687598705291748 	 loss mean: 89.85873413085938
nll mean: 82.09765625 	 kl mean: 7.687598705291748 	 loss mean: 89.7852554321289
nll mean: 82.56560516357422 	 kl mean: 7.687598705291748 	 loss mean: 90.25320434570312


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.60it/s]
100%|██████████| 10/10 [00:00<00:00, 21.80it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.45it/s][A

nll mean: 82.69154357910156 	 kl mean: 7.687598705291748 	 loss mean: 90.37914276123047
nll mean: 108.41007995605469 	 kl mean: 7.956856727600098 	 loss mean: 116.366943359375
nll mean: 109.20088195800781 	 kl mean: 7.956856727600098 	 loss mean: 117.15773010253906
nll mean: 108.53692626953125 	 kl mean: 7.956856727600098 	 loss mean: 116.49378967285156
nll mean: 108.94611358642578 	 kl mean: 7.956856727600098 	 loss mean: 116.90296173095703


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.45it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.29it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.22it/s][A

nll mean: 108.97547912597656 	 kl mean: 7.956856727600098 	 loss mean: 116.93234252929688
nll mean: 109.54049682617188 	 kl mean: 7.956856727600098 	 loss mean: 117.49735260009766
nll mean: 109.26689147949219 	 kl mean: 7.956856727600098 	 loss mean: 117.2237548828125
nll mean: 108.79777526855469 	 kl mean: 7.956856727600098 	 loss mean: 116.754638671875
nll mean: 108.94243621826172 	 kl mean: 7.956856727600098 	 loss mean: 116.8992919921875


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.01it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 11.99it/s][A

nll mean: 109.33455657958984 	 kl mean: 7.956856727600098 	 loss mean: 117.29141235351562
nll mean: 120.78358459472656 	 kl mean: 8.521693229675293 	 loss mean: 129.30526733398438
nll mean: 121.56137084960938 	 kl mean: 8.521693229675293 	 loss mean: 130.08306884765625


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 20%|██        | 2/10 [00:00<00:00, 11.99it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 40%|████      | 4/10 [00:00<00:00, 12.03it/s][A

nll mean: 121.032470703125 	 kl mean: 8.521693229675293 	 loss mean: 129.55416870117188
nll mean: 121.95963287353516 	 kl mean: 8.521693229675293 	 loss mean: 130.4813232421875
nll mean: 121.27275085449219 	 kl mean: 8.521693229675293 	 loss mean: 129.79443359375


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 40%|████      | 4/10 [00:00<00:00, 12.03it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.17it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.13it/s][A

nll mean: 121.09463500976562 	 kl mean: 8.521693229675293 	 loss mean: 129.6163330078125
nll mean: 120.90811157226562 	 kl mean: 8.521693229675293 	 loss mean: 129.42979431152344
nll mean: 121.1576156616211 	 kl mean: 8.521693229675293 	 loss mean: 129.67930603027344


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.21it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.97it/s][A

nll mean: 120.66377258300781 	 kl mean: 8.521693229675293 	 loss mean: 129.18545532226562
nll mean: 121.09529113769531 	 kl mean: 8.521693229675293 	 loss mean: 129.61697387695312
nll mean: 62.17742919921875 	 kl mean: 9.349200248718262 	 loss mean: 71.52662658691406


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 10%|█         | 1/10 [00:00<00:00,  9.97it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00,  9.98it/s][A

nll mean: 62.47975158691406 	 kl mean: 9.349200248718262 	 loss mean: 71.82894897460938
nll mean: 62.62038803100586 	 kl mean: 9.349200248718262 	 loss mean: 71.96958923339844
nll mean: 62.39564514160156 	 kl mean: 9.349200248718262 	 loss mean: 71.74484252929688


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00,  9.98it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.04it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.12it/s][A

nll mean: 61.809364318847656 	 kl mean: 9.349200248718262 	 loss mean: 71.15856170654297
nll mean: 62.799041748046875 	 kl mean: 9.349200248718262 	 loss mean: 72.14823913574219
nll mean: 62.4029541015625 	 kl mean: 9.349200248718262 	 loss mean: 71.75215148925781


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.59it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.12it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.59it/s]
                                               [A
                                              

nll mean: 62.71906280517578 	 kl mean: 9.349200248718262 	 loss mean: 72.0682601928711
nll mean: 62.68963623046875 	 kl mean: 9.349200248718262 	 loss mean: 72.03883361816406


 76%|███████▋  | 29/38 [00:19<00:05,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.07it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.07it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.94it/s][A

nll mean: 62.41923522949219 	 kl mean: 9.349200248718262 	 loss mean: 71.7684326171875
nll mean: 105.22691345214844 	 kl mean: 9.035836219787598 	 loss mean: 114.26274108886719
nll mean: 105.72367858886719 	 kl mean: 9.035836219787598 	 loss mean: 114.75951385498047


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 20%|██        | 2/10 [00:00<00:00, 12.94it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.88it/s][A

nll mean: 105.49923706054688 	 kl mean: 9.035836219787598 	 loss mean: 114.53507995605469
nll mean: 105.8394775390625 	 kl mean: 9.035836219787598 	 loss mean: 114.87530517578125
nll mean: 105.17120361328125 	 kl mean: 9.035836219787598 	 loss mean: 114.20703887939453


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 40%|████      | 4/10 [00:00<00:00, 12.88it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.96it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.87it/s][A

nll mean: 105.27013397216797 	 kl mean: 9.035836219787598 	 loss mean: 114.30596160888672
nll mean: 105.07852172851562 	 kl mean: 9.035836219787598 	 loss mean: 114.1143569946289
nll mean: 105.60604858398438 	 kl mean: 9.035836219787598 	 loss mean: 114.64189910888672


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.35it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.87it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.76it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.53970336914062 	 kl mean: 9.035836219787598 	 loss mean: 114.57554626464844
nll mean: 105.2430191040039 	 kl mean: 9.035836219787598 	 loss mean: 114.27885437011719
nll mean: 138.01980590820312 	 kl mean: 9.67552661895752 	 loss mean: 147.69534301757812


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00, 10.16it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]

nll mean: 137.9764404296875 	 kl mean: 9.67552661895752 	 loss mean: 147.65196228027344
nll mean: 138.78347778320312 	 kl mean: 9.67552661895752 	 loss mean: 148.45901489257812
nll mean: 138.2724609375 	 kl mean: 9.67552661895752 	 loss mean: 147.947998046875



                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 10.09it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.05it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.92it/s][A

nll mean: 138.13134765625 	 kl mean: 9.67552661895752 	 loss mean: 147.806884765625
nll mean: 137.85824584960938 	 kl mean: 9.67552661895752 	 loss mean: 147.53378295898438


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.92it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.89it/s][A
                                               [A
[A                                           

nll mean: 137.4623565673828 	 kl mean: 9.67552661895752 	 loss mean: 147.1378936767578
nll mean: 138.0374755859375 	 kl mean: 9.67552661895752 	 loss mean: 147.71298217773438


 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 80%|████████  | 8/10 [00:01<00:00,  9.90it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.91it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.7833251953125 	 kl mean: 9.67552661895752 	 loss mean: 147.4588623046875
nll mean: 138.12939453125 	 kl mean: 9.67552661895752 	 loss mean: 147.804931640625
nll mean: 62.985984802246094 	 kl mean: 8.161412239074707 	 loss mean: 71.14739990234375
nll mean: 62.96961212158203 	 kl mean: 8.161412239074707 	 loss mean: 71.13101959228516


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 30%|███       | 3/10 [00:00<00:00, 26.26it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.89it/s][A

nll mean: 62.71034240722656 	 kl mean: 8.161412239074707 	 loss mean: 70.87174987792969
nll mean: 62.91009521484375 	 kl mean: 8.161412239074707 	 loss mean: 71.07150268554688
nll mean: 62.863861083984375 	 kl mean: 8.161412239074707 	 loss mean: 71.02527618408203
nll mean: 62.54871368408203 	 kl mean: 8.161412239074707 	 loss mean: 70.71012115478516
nll mean: 62.736427307128906 	 kl mean: 8.161412239074707 	 loss mean: 70.89784240722656
nll mean: 62.979759216308594 	 kl mean: 8.161412239074707 	 loss mean: 71.14117431640625


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.89it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.20it/s]
100%|██████████| 10/10 [00:00<00:00, 25.44it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 21.59it/s][A

nll mean: 63.826515197753906 	 kl mean: 8.161412239074707 	 loss mean: 71.98793029785156
nll mean: 63.073699951171875 	 kl mean: 8.161412239074707 	 loss mean: 71.235107421875
nll mean: 119.55696105957031 	 kl mean: 7.894026756286621 	 loss mean: 127.45097351074219
nll mean: 120.33560180664062 	 kl mean: 7.894026756286621 	 loss mean: 128.2296142578125
nll mean: 120.36967468261719 	 kl mean: 7.894026756286621 	 loss mean: 128.26370239257812


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.59it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.44it/s][A

nll mean: 120.42634582519531 	 kl mean: 7.894026756286621 	 loss mean: 128.32037353515625
nll mean: 119.69029235839844 	 kl mean: 7.894026756286621 	 loss mean: 127.5843276977539
nll mean: 120.30557250976562 	 kl mean: 7.894026756286621 	 loss mean: 128.19960021972656
nll mean: 120.45120239257812 	 kl mean: 7.894026756286621 	 loss mean: 128.34523010253906
nll mean: 119.88679504394531 	 kl mean: 7.894026756286621 	 loss mean: 127.78080749511719


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.44it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.34it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.65261840820312 	 kl mean: 7.894026756286621 	 loss mean: 127.5466537475586
nll mean: 120.59593200683594 	 kl mean: 7.894026756286621 	 loss mean: 128.48995971679688
nll mean: 119.76525115966797 	 kl mean: 9.188162803649902 	 loss mean: 128.9534149169922


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.41it/s][A

nll mean: 120.20420837402344 	 kl mean: 9.188162803649902 	 loss mean: 129.39236450195312
nll mean: 119.8037109375 	 kl mean: 9.188162803649902 	 loss mean: 128.99188232421875
nll mean: 119.70358276367188 	 kl mean: 9.188162803649902 	 loss mean: 128.89173889160156


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.41it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.41it/s][A

nll mean: 120.23081970214844 	 kl mean: 9.188162803649902 	 loss mean: 129.41897583007812
nll mean: 120.00543212890625 	 kl mean: 9.188162803649902 	 loss mean: 129.193603515625
nll mean: 119.70576477050781 	 kl mean: 9.188162803649902 	 loss mean: 128.89393615722656


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.41it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.50it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.88957214355469 	 kl mean: 9.188162803649902 	 loss mean: 129.07772827148438
nll mean: 120.37712097167969 	 kl mean: 9.188162803649902 	 loss mean: 129.56527709960938
nll mean: 119.7037353515625 	 kl mean: 9.188162803649902 	 loss mean: 128.89190673828125


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.55it/s][A

nll mean: 112.95719909667969 	 kl mean: 8.613710403442383 	 loss mean: 121.5709228515625
nll mean: 112.83458709716797 	 kl mean: 8.613710403442383 	 loss mean: 121.44830322265625
nll mean: 112.62100219726562 	 kl mean: 8.613710403442383 	 loss mean: 121.2347183227539


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.55it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A

nll mean: 112.84738159179688 	 kl mean: 8.613710403442383 	 loss mean: 121.46109008789062
nll mean: 112.50592803955078 	 kl mean: 8.613710403442383 	 loss mean: 121.11964416503906
nll mean: 112.66898345947266 	 kl mean: 8.613710403442383 	 loss mean: 121.2826919555664


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.60it/s][A

nll mean: 112.72901153564453 	 kl mean: 8.613710403442383 	 loss mean: 121.34272003173828
nll mean: 112.55009460449219 	 kl mean: 8.613710403442383 	 loss mean: 121.16380310058594
nll mean: 113.33763122558594 	 kl mean: 8.613710403442383 	 loss mean: 121.95134735107422


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.56it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.11it/s][A

nll mean: 112.56301879882812 	 kl mean: 8.613710403442383 	 loss mean: 121.17672729492188
nll mean: 110.64450073242188 	 kl mean: 8.576875686645508 	 loss mean: 119.22137451171875
nll mean: 110.33357238769531 	 kl mean: 8.576875686645508 	 loss mean: 118.91044616699219
nll mean: 110.05084228515625 	 kl mean: 8.576875686645508 	 loss mean: 118.62771606445312
nll mean: 110.04798889160156 	 kl mean: 8.576875686645508 	 loss mean: 118.62486267089844


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.11it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.61it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.39it/s][A

nll mean: 110.11531066894531 	 kl mean: 8.576875686645508 	 loss mean: 118.69218444824219
nll mean: 110.19264221191406 	 kl mean: 8.576875686645508 	 loss mean: 118.76951599121094
nll mean: 110.57672882080078 	 kl mean: 8.576875686645508 	 loss mean: 119.15360260009766
nll mean: 110.21990966796875 	 kl mean: 8.576875686645508 	 loss mean: 118.79678344726562
nll mean: 110.07841491699219 	 kl mean: 8.576875686645508 	 loss mean: 118.65528869628906


                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 21.31it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.69it/s][A

nll mean: 110.27479553222656 	 kl mean: 8.576875686645508 	 loss mean: 118.85166931152344
nll mean: 85.0479736328125 	 kl mean: 9.153246879577637 	 loss mean: 94.20121765136719
nll mean: 85.06493377685547 	 kl mean: 9.153246879577637 	 loss mean: 94.21818542480469
nll mean: 85.28522491455078 	 kl mean: 9.153246879577637 	 loss mean: 94.43846893310547
nll mean: 85.28793334960938 	 kl mean: 9.153246879577637 	 loss mean: 94.44117736816406
nll mean: 84.32131958007812 	 kl mean: 9.153246879577637 	 loss mean: 93.47457122802734
nll mean: 85.20579528808594 	 kl mean: 9.153246879577637 	 loss mean: 94.35905456542969


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.69it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 30.47it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 84.53129577636719 	 kl mean: 9.153246879577637 	 loss mean: 93.68453979492188
nll mean: 85.47044372558594 	 kl mean: 9.153246879577637 	 loss mean: 94.6236801147461
nll mean: 84.83663177490234 	 kl mean: 9.153246879577637 	 loss mean: 93.9898910522461
nll mean: 84.90239715576172 	 kl mean: 9.153246879577637 	 loss mean: 94.05564880371094
Approximate NLL:
tensor(121.3209, device='cuda:0')
Approximate KL:
tensor(8.7278, device='cuda:0')
Testing took 0:00:25.341975


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 26.00it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].00it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].00it/s][A
                                              

nll mean: 109.03711700439453 	 kl mean: 9.29767894744873 	 loss mean: 118.33480072021484
nll mean: 108.59651184082031 	 kl mean: 9.29767894744873 	 loss mean: 117.8941879272461
nll mean: 108.49610900878906 	 kl mean: 9.29767894744873 	 loss mean: 117.79379272460938
nll mean: 108.91555786132812 	 kl mean: 9.29767894744873 	 loss mean: 118.21322631835938
nll mean: 108.82846069335938 	 kl mean: 9.29767894744873 	 loss mean: 118.12614440917969



  0%|          | 0/38 [00:00<?, ?it/s].00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].65it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].65it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].65it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.41it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.15it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.40126037597656 	 kl mean: 9.29767894744873 	 loss mean: 118.69894409179688
nll mean: 109.58343505859375 	 kl mean: 9.29767894744873 	 loss mean: 118.88111114501953
nll mean: 108.89826202392578 	 kl mean: 9.29767894744873 	 loss mean: 118.19593811035156
nll mean: 108.16291809082031 	 kl mean: 9.29767894744873 	 loss mean: 117.46060180664062
nll mean: 109.15081787109375 	 kl mean: 9.29767894744873 	 loss mean: 118.44850158691406


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 14.06it/s][A

nll mean: 124.83537292480469 	 kl mean: 9.068607330322266 	 loss mean: 133.90399169921875
nll mean: 124.50137329101562 	 kl mean: 9.068607330322266 	 loss mean: 133.56997680664062
nll mean: 125.6463623046875 	 kl mean: 9.068607330322266 	 loss mean: 134.7149658203125


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 14.06it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 40%|████      | 4/10 [00:00<00:00, 14.21it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.17it/s][A

nll mean: 125.51956176757812 	 kl mean: 9.068607330322266 	 loss mean: 134.58816528320312
nll mean: 125.12625885009766 	 kl mean: 9.068607330322266 	 loss mean: 134.1948699951172
nll mean: 124.74075317382812 	 kl mean: 9.068607330322266 	 loss mean: 133.80935668945312


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.17it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.03it/s][A

nll mean: 124.99979400634766 	 kl mean: 9.068607330322266 	 loss mean: 134.06838989257812
nll mean: 124.68885803222656 	 kl mean: 9.068607330322266 	 loss mean: 133.75746154785156
nll mean: 124.59347534179688 	 kl mean: 9.068607330322266 	 loss mean: 133.66207885742188


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.03it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.20it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 24.76it/s][A

nll mean: 124.91152954101562 	 kl mean: 9.068607330322266 	 loss mean: 133.98013305664062
nll mean: 98.56256103515625 	 kl mean: 8.385457992553711 	 loss mean: 106.94801330566406
nll mean: 99.05781555175781 	 kl mean: 8.385457992553711 	 loss mean: 107.44328308105469
nll mean: 98.97940826416016 	 kl mean: 8.385457992553711 	 loss mean: 107.36486053466797
nll mean: 98.75914001464844 	 kl mean: 8.385457992553711 	 loss mean: 107.14459228515625


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 30%|███       | 3/10 [00:00<00:00, 24.76it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.54it/s][A

nll mean: 99.33894348144531 	 kl mean: 8.385457992553711 	 loss mean: 107.72441101074219
nll mean: 99.5749740600586 	 kl mean: 8.385457992553711 	 loss mean: 107.96043395996094
nll mean: 99.56838989257812 	 kl mean: 8.385457992553711 	 loss mean: 107.953857421875
nll mean: 98.94612121582031 	 kl mean: 8.385457992553711 	 loss mean: 107.33158111572266
nll mean: 98.87952423095703 	 kl mean: 8.385457992553711 	 loss mean: 107.26498413085938


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.03it/s]
100%|██████████| 10/10 [00:00<00:00, 24.51it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A

nll mean: 99.48179626464844 	 kl mean: 8.385457992553711 	 loss mean: 107.86725616455078
nll mean: 138.42813110351562 	 kl mean: 8.801817893981934 	 loss mean: 147.22994995117188
nll mean: 138.13650512695312 	 kl mean: 8.801817893981934 	 loss mean: 146.93833923339844


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.14it/s]
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A

nll mean: 138.08834838867188 	 kl mean: 8.801817893981934 	 loss mean: 146.89016723632812
nll mean: 137.76516723632812 	 kl mean: 8.801817893981934 	 loss mean: 146.56698608398438
nll mean: 138.1910400390625 	 kl mean: 8.801817893981934 	 loss mean: 146.99285888671875


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.78it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A

nll mean: 137.79888916015625 	 kl mean: 8.801817893981934 	 loss mean: 146.6007080078125
nll mean: 137.66314697265625 	 kl mean: 8.801817893981934 	 loss mean: 146.4649658203125
nll mean: 138.35110473632812 	 kl mean: 8.801817893981934 	 loss mean: 147.15292358398438


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.14it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.81it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.81it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]

nll mean: 138.48410034179688 	 kl mean: 8.801817893981934 	 loss mean: 147.28591918945312
nll mean: 138.54937744140625 	 kl mean: 8.801817893981934 	 loss mean: 147.3511962890625
nll mean: 125.9752197265625 	 kl mean: 8.548948287963867 	 loss mean: 134.524169921875



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 13.97it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.88it/s][A

nll mean: 126.58543395996094 	 kl mean: 8.548948287963867 	 loss mean: 135.1343994140625
nll mean: 126.73576354980469 	 kl mean: 8.548948287963867 	 loss mean: 135.28469848632812
nll mean: 127.18584442138672 	 kl mean: 8.548948287963867 	 loss mean: 135.7347869873047



                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.90it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.65it/s][A

nll mean: 126.69328308105469 	 kl mean: 8.548948287963867 	 loss mean: 135.2422332763672
nll mean: 126.49504089355469 	 kl mean: 8.548948287963867 	 loss mean: 135.0439910888672
nll mean: 126.60374450683594 	 kl mean: 8.548948287963867 	 loss mean: 135.15269470214844



                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.98it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.00it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.63882446289062 	 kl mean: 8.548948287963867 	 loss mean: 135.18777465820312
nll mean: 127.07242584228516 	 kl mean: 8.548948287963867 	 loss mean: 135.62136840820312
nll mean: 126.4033203125 	 kl mean: 8.548948287963867 	 loss mean: 134.9522705078125



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s]
 20%|██        | 2/10 [00:00<00:00, 14.13it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A

nll mean: 124.30824279785156 	 kl mean: 8.467986106872559 	 loss mean: 132.77622985839844
nll mean: 124.40848541259766 	 kl mean: 8.467986106872559 	 loss mean: 132.87646484375
nll mean: 124.05878448486328 	 kl mean: 8.467986106872559 	 loss mean: 132.52676391601562



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.08it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.07it/s][A

nll mean: 123.99456787109375 	 kl mean: 8.467986106872559 	 loss mean: 132.46255493164062
nll mean: 124.78880310058594 	 kl mean: 8.467986106872559 	 loss mean: 133.25677490234375
nll mean: 124.54109954833984 	 kl mean: 8.467986106872559 	 loss mean: 133.0090789794922



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.15it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A

nll mean: 124.45486450195312 	 kl mean: 8.467986106872559 	 loss mean: 132.9228515625
nll mean: 124.28008270263672 	 kl mean: 8.467986106872559 	 loss mean: 132.74807739257812
nll mean: 124.21658325195312 	 kl mean: 8.467986106872559 	 loss mean: 132.6845703125



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.05it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.25it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 124.51312255859375 	 kl mean: 8.467986106872559 	 loss mean: 132.98110961914062
nll mean: 135.40765380859375 	 kl mean: 8.433950424194336 	 loss mean: 143.8415985107422
nll mean: 135.5928192138672 	 kl mean: 8.433950424194336 	 loss mean: 144.02676391601562
nll mean: 134.52273559570312 	 kl mean: 8.433950424194336 	 loss mean: 142.9566650390625
nll mean: 134.4905242919922 	 kl mean: 8.433950424194336 	 loss mean: 142.92446899414062



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.02it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.84it/s][A

nll mean: 135.35740661621094 	 kl mean: 8.433950424194336 	 loss mean: 143.79135131835938
nll mean: 134.5955810546875 	 kl mean: 8.433950424194336 	 loss mean: 143.029541015625
nll mean: 135.2899932861328 	 kl mean: 8.433950424194336 	 loss mean: 143.72393798828125
nll mean: 135.60055541992188 	 kl mean: 8.433950424194336 	 loss mean: 144.03451538085938
nll mean: 135.28201293945312 	 kl mean: 8.433950424194336 	 loss mean: 143.71597290039062



                                              
100%|██████████| 10/10 [00:00<00:00, 24.68it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.86it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A

nll mean: 135.62393188476562 	 kl mean: 8.433950424194336 	 loss mean: 144.057861328125
nll mean: 106.54331970214844 	 kl mean: 8.522968292236328 	 loss mean: 115.06629180908203
nll mean: 107.62785339355469 	 kl mean: 8.522968292236328 	 loss mean: 116.15083312988281
nll mean: 107.02864074707031 	 kl mean: 8.522968292236328 	 loss mean: 115.55160522460938
nll mean: 106.88667297363281 	 kl mean: 8.522968292236328 	 loss mean: 115.4096450805664



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.79it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.76it/s][A

nll mean: 106.40706634521484 	 kl mean: 8.522968292236328 	 loss mean: 114.93003845214844
nll mean: 107.16990661621094 	 kl mean: 8.522968292236328 	 loss mean: 115.69287109375
nll mean: 106.98698425292969 	 kl mean: 8.522968292236328 	 loss mean: 115.50996398925781
nll mean: 106.52195739746094 	 kl mean: 8.522968292236328 	 loss mean: 115.044921875
nll mean: 106.85529327392578 	 kl mean: 8.522968292236328 	 loss mean: 115.37826538085938



                                              
100%|██████████| 10/10 [00:00<00:00, 24.68it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.68it/s][A

nll mean: 106.60185241699219 	 kl mean: 8.522968292236328 	 loss mean: 115.12481689453125
nll mean: 129.85256958007812 	 kl mean: 9.290651321411133 	 loss mean: 139.14321899414062
nll mean: 129.9766845703125 	 kl mean: 9.290651321411133 	 loss mean: 139.267333984375



                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.65it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              

nll mean: 130.15615844726562 	 kl mean: 9.290651321411133 	 loss mean: 139.44680786132812
nll mean: 130.50515747070312 	 kl mean: 9.290651321411133 	 loss mean: 139.79580688476562
nll mean: 130.33950805664062 	 kl mean: 9.290651321411133 	 loss mean: 139.63015747070312



 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.93it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.80it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A

nll mean: 129.8095703125 	 kl mean: 9.290651321411133 	 loss mean: 139.1002197265625
nll mean: 130.36325073242188 	 kl mean: 9.290651321411133 	 loss mean: 139.65390014648438
nll mean: 130.4308319091797 	 kl mean: 9.290651321411133 	 loss mean: 139.72149658203125
nll mean: 130.04458618164062 	 kl mean: 9.290651321411133 	 loss mean: 139.33523559570312



                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.74it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.92it/s][A

nll mean: 129.847900390625 	 kl mean: 9.290651321411133 	 loss mean: 139.1385498046875
nll mean: 130.32534790039062 	 kl mean: 8.917287826538086 	 loss mean: 139.24264526367188
nll mean: 130.28726196289062 	 kl mean: 8.917287826538086 	 loss mean: 139.2045440673828
nll mean: 130.2453155517578 	 kl mean: 8.917287826538086 	 loss mean: 139.16259765625
nll mean: 130.5444793701172 	 kl mean: 8.917287826538086 	 loss mean: 139.46176147460938


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.92it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.65it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.44it/s][A

nll mean: 131.73013305664062 	 kl mean: 8.917287826538086 	 loss mean: 140.6474151611328
nll mean: 130.50662231445312 	 kl mean: 8.917287826538086 	 loss mean: 139.4239044189453
nll mean: 130.43165588378906 	 kl mean: 8.917287826538086 	 loss mean: 139.34893798828125
nll mean: 130.08230590820312 	 kl mean: 8.917287826538086 	 loss mean: 138.99960327148438
nll mean: 130.48379516601562 	 kl mean: 8.917287826538086 	 loss mean: 139.4010772705078


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.28it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.87it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A

nll mean: 130.70980834960938 	 kl mean: 8.917287826538086 	 loss mean: 139.62709045410156
nll mean: 119.3216323852539 	 kl mean: 8.978694915771484 	 loss mean: 128.30032348632812
nll mean: 118.65310668945312 	 kl mean: 8.978694915771484 	 loss mean: 127.63180541992188
nll mean: 119.15789794921875 	 kl mean: 8.978694915771484 	 loss mean: 128.1365966796875
nll mean: 118.92654418945312 	 kl mean: 8.978694915771484 	 loss mean: 127.90524291992188



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.74it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.78it/s][A

nll mean: 118.72903442382812 	 kl mean: 8.978694915771484 	 loss mean: 127.70773315429688
nll mean: 119.53915405273438 	 kl mean: 8.978694915771484 	 loss mean: 128.51785278320312
nll mean: 118.793212890625 	 kl mean: 8.978694915771484 	 loss mean: 127.77191162109375
nll mean: 119.3992919921875 	 kl mean: 8.978694915771484 	 loss mean: 128.37799072265625
nll mean: 119.1250991821289 	 kl mean: 8.978694915771484 	 loss mean: 128.1038055419922



                                               
100%|██████████| 10/10 [00:00<00:00, 24.70it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.81it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A

nll mean: 118.62727355957031 	 kl mean: 8.978694915771484 	 loss mean: 127.60595703125
nll mean: 139.67684936523438 	 kl mean: 9.232158660888672 	 loss mean: 148.9090118408203
nll mean: 140.60556030273438 	 kl mean: 9.232158660888672 	 loss mean: 149.8377227783203
nll mean: 140.90548706054688 	 kl mean: 9.232158660888672 	 loss mean: 150.13763427734375
nll mean: 140.38941955566406 	 kl mean: 9.232158660888672 	 loss mean: 149.62158203125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.51it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.47it/s][A

nll mean: 141.0498809814453 	 kl mean: 9.232158660888672 	 loss mean: 150.28204345703125
nll mean: 140.43560791015625 	 kl mean: 9.232158660888672 	 loss mean: 149.66775512695312
nll mean: 140.75680541992188 	 kl mean: 9.232158660888672 	 loss mean: 149.9889678955078
nll mean: 140.61611938476562 	 kl mean: 9.232158660888672 	 loss mean: 149.8482666015625
nll mean: 140.6328125 	 kl mean: 9.232158660888672 	 loss mean: 149.86495971679688



                                               
100%|██████████| 10/10 [00:00<00:00, 21.23it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A

nll mean: 140.42520141601562 	 kl mean: 9.232158660888672 	 loss mean: 149.65737915039062
nll mean: 119.85240173339844 	 kl mean: 9.261819839477539 	 loss mean: 129.1142120361328
nll mean: 119.6845703125 	 kl mean: 9.261819839477539 	 loss mean: 128.94638061523438



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A

nll mean: 120.02555847167969 	 kl mean: 9.261819839477539 	 loss mean: 129.28738403320312
nll mean: 119.78723907470703 	 kl mean: 9.261819839477539 	 loss mean: 129.049072265625
nll mean: 120.15743255615234 	 kl mean: 9.261819839477539 	 loss mean: 129.41925048828125



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.53it/s][A

nll mean: 120.1328125 	 kl mean: 9.261819839477539 	 loss mean: 129.39462280273438
nll mean: 119.29777526855469 	 kl mean: 9.261819839477539 	 loss mean: 128.55960083007812
nll mean: 120.19798278808594 	 kl mean: 9.261819839477539 	 loss mean: 129.4597930908203



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.54it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]

nll mean: 120.09439849853516 	 kl mean: 9.261819839477539 	 loss mean: 129.35621643066406
nll mean: 119.93760681152344 	 kl mean: 9.261819839477539 	 loss mean: 129.19943237304688
nll mean: 162.1737823486328 	 kl mean: 9.592727661132812 	 loss mean: 171.76651000976562



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s]
 20%|██        | 2/10 [00:00<00:00, 10.03it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.98it/s][A

nll mean: 161.5426025390625 	 kl mean: 9.592727661132812 	 loss mean: 171.1353302001953
nll mean: 161.73532104492188 	 kl mean: 9.592727661132812 	 loss mean: 171.32803344726562



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.71it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.92it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.91it/s][A

nll mean: 161.7616729736328 	 kl mean: 9.592727661132812 	 loss mean: 171.35440063476562
nll mean: 162.12710571289062 	 kl mean: 9.592727661132812 	 loss mean: 171.71983337402344



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.84it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.87it/s][A
[A                                           

nll mean: 161.6136932373047 	 kl mean: 9.592727661132812 	 loss mean: 171.2064208984375
nll mean: 161.81011962890625 	 kl mean: 9.592727661132812 	 loss mean: 171.40284729003906


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.71it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.94it/s][A

nll mean: 162.2285614013672 	 kl mean: 9.592727661132812 	 loss mean: 171.8212890625
nll mean: 162.24110412597656 	 kl mean: 9.592727661132812 	 loss mean: 171.83383178710938
nll mean: 162.2284393310547 	 kl mean: 9.592727661132812 	 loss mean: 171.8211669921875



 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.00it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 17.87it/s][A

nll mean: 134.84034729003906 	 kl mean: 8.218578338623047 	 loss mean: 143.05892944335938
nll mean: 135.4283447265625 	 kl mean: 8.218578338623047 	 loss mean: 143.64694213867188
nll mean: 134.5880126953125 	 kl mean: 8.218578338623047 	 loss mean: 142.80657958984375
nll mean: 134.76217651367188 	 kl mean: 8.218578338623047 	 loss mean: 142.98074340820312



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 17.89it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 17.87it/s][A

nll mean: 134.78170776367188 	 kl mean: 8.218578338623047 	 loss mean: 143.00027465820312
nll mean: 134.87672424316406 	 kl mean: 8.218578338623047 	 loss mean: 143.09530639648438
nll mean: 134.57369995117188 	 kl mean: 8.218578338623047 	 loss mean: 142.79229736328125
nll mean: 134.45703125 	 kl mean: 8.218578338623047 	 loss mean: 142.67562866210938



                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.85it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.80860900878906 	 kl mean: 8.218578338623047 	 loss mean: 142.02719116210938
nll mean: 134.74032592773438 	 kl mean: 8.218578338623047 	 loss mean: 142.9589080810547
nll mean: 144.04611206054688 	 kl mean: 9.026832580566406 	 loss mean: 153.0729522705078


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A

nll mean: 143.90875244140625 	 kl mean: 9.026832580566406 	 loss mean: 152.9355926513672
nll mean: 144.39144897460938 	 kl mean: 9.026832580566406 	 loss mean: 153.4182891845703
nll mean: 143.77072143554688 	 kl mean: 9.026832580566406 	 loss mean: 152.79754638671875


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.78it/s][A

nll mean: 143.6954345703125 	 kl mean: 9.026832580566406 	 loss mean: 152.72227478027344
nll mean: 144.27981567382812 	 kl mean: 9.026832580566406 	 loss mean: 153.306640625
nll mean: 143.6116943359375 	 kl mean: 9.026832580566406 	 loss mean: 152.63853454589844


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.78it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.50it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.50it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.77it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.74it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 143.90087890625 	 kl mean: 9.026832580566406 	 loss mean: 152.92770385742188
nll mean: 144.08633422851562 	 kl mean: 9.026832580566406 	 loss mean: 153.1131591796875
nll mean: 143.6758575439453 	 kl mean: 9.026832580566406 	 loss mean: 152.70269775390625



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s]
 30%|███       | 3/10 [00:00<00:00, 24.32it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A

nll mean: 145.16375732421875 	 kl mean: 8.253942489624023 	 loss mean: 153.41769409179688
nll mean: 144.59361267089844 	 kl mean: 8.253942489624023 	 loss mean: 152.84756469726562
nll mean: 145.52072143554688 	 kl mean: 8.253942489624023 	 loss mean: 153.774658203125
nll mean: 145.66407775878906 	 kl mean: 8.253942489624023 	 loss mean: 153.91802978515625
nll mean: 145.41510009765625 	 kl mean: 8.253942489624023 	 loss mean: 153.66903686523438



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.27it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.34it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.44it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.44it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 145.19094848632812 	 kl mean: 8.253942489624023 	 loss mean: 153.44488525390625
nll mean: 144.8995361328125 	 kl mean: 8.253942489624023 	 loss mean: 153.15347290039062
nll mean: 144.9232635498047 	 kl mean: 8.253942489624023 	 loss mean: 153.17721557617188
nll mean: 144.6209716796875 	 kl mean: 8.253942489624023 	 loss mean: 152.87493896484375
nll mean: 145.02320861816406 	 kl mean: 8.253942489624023 	 loss mean: 153.27716064453125



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A

nll mean: 133.31907653808594 	 kl mean: 8.894048690795898 	 loss mean: 142.213134765625
nll mean: 133.27420043945312 	 kl mean: 8.894048690795898 	 loss mean: 142.16824340820312
nll mean: 133.66323852539062 	 kl mean: 8.894048690795898 	 loss mean: 142.5572967529297
nll mean: 133.2024383544922 	 kl mean: 8.894048690795898 	 loss mean: 142.09649658203125
nll mean: 132.9210968017578 	 kl mean: 8.894048690795898 	 loss mean: 141.8151397705078
nll mean: 133.2307891845703 	 kl mean: 8.894048690795898 	 loss mean: 142.12484741210938


 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.96it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.55it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.04it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.02it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 132.9959716796875 	 kl mean: 8.894048690795898 	 loss mean: 141.8900146484375
nll mean: 132.81610107421875 	 kl mean: 8.894048690795898 	 loss mean: 141.71014404296875
nll mean: 132.7838592529297 	 kl mean: 8.894048690795898 	 loss mean: 141.67791748046875
nll mean: 133.4311981201172 	 kl mean: 8.894048690795898 	 loss mean: 142.3252410888672



                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.74it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A

nll mean: 128.8603515625 	 kl mean: 9.594253540039062 	 loss mean: 138.45460510253906
nll mean: 129.52919006347656 	 kl mean: 9.594253540039062 	 loss mean: 139.12344360351562
nll mean: 128.92660522460938 	 kl mean: 9.594253540039062 	 loss mean: 138.52085876464844



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.44it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.40it/s][A

nll mean: 129.331787109375 	 kl mean: 9.594253540039062 	 loss mean: 138.92604064941406
nll mean: 129.41812133789062 	 kl mean: 9.594253540039062 	 loss mean: 139.0123748779297
nll mean: 129.50515747070312 	 kl mean: 9.594253540039062 	 loss mean: 139.0994110107422



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A

nll mean: 129.3616943359375 	 kl mean: 9.594253540039062 	 loss mean: 138.95594787597656
nll mean: 128.76199340820312 	 kl mean: 9.594253540039062 	 loss mean: 138.3562469482422
nll mean: 129.70382690429688 	 kl mean: 9.594253540039062 	 loss mean: 139.29808044433594



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.49it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 12.72it/s][A

nll mean: 129.33766174316406 	 kl mean: 9.594253540039062 	 loss mean: 138.93191528320312
nll mean: 148.76739501953125 	 kl mean: 9.092965126037598 	 loss mean: 157.8603515625
nll mean: 148.02528381347656 	 kl mean: 9.092965126037598 	 loss mean: 157.11825561523438



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A

nll mean: 148.78042602539062 	 kl mean: 9.092965126037598 	 loss mean: 157.87339782714844
nll mean: 147.83547973632812 	 kl mean: 9.092965126037598 	 loss mean: 156.92845153808594
nll mean: 148.60629272460938 	 kl mean: 9.092965126037598 	 loss mean: 157.69924926757812



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.68it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A

nll mean: 148.22813415527344 	 kl mean: 9.092965126037598 	 loss mean: 157.32110595703125
nll mean: 148.71339416503906 	 kl mean: 9.092965126037598 	 loss mean: 157.80636596679688
nll mean: 148.01254272460938 	 kl mean: 9.092965126037598 	 loss mean: 157.10549926757812



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.61it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]

nll mean: 148.68902587890625 	 kl mean: 9.092965126037598 	 loss mean: 157.781982421875
nll mean: 148.18246459960938 	 kl mean: 9.092965126037598 	 loss mean: 157.27542114257812
nll mean: 155.80831909179688 	 kl mean: 8.879578590393066 	 loss mean: 164.6879119873047



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.53it/s][A

nll mean: 156.177490234375 	 kl mean: 8.879578590393066 	 loss mean: 165.05706787109375
nll mean: 155.63995361328125 	 kl mean: 8.879578590393066 	 loss mean: 164.51953125
nll mean: 156.30718994140625 	 kl mean: 8.879578590393066 	 loss mean: 165.186767578125



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A

nll mean: 156.2658233642578 	 kl mean: 8.879578590393066 	 loss mean: 165.14540100097656
nll mean: 156.23458862304688 	 kl mean: 8.879578590393066 	 loss mean: 165.11416625976562
nll mean: 156.16653442382812 	 kl mean: 8.879578590393066 	 loss mean: 165.04611206054688



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.65it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 156.0921173095703 	 kl mean: 8.879578590393066 	 loss mean: 164.97169494628906
nll mean: 155.20672607421875 	 kl mean: 8.879578590393066 	 loss mean: 164.0863037109375
nll mean: 155.29220581054688 	 kl mean: 8.879578590393066 	 loss mean: 164.17178344726562


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 10.42it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.28it/s][A

nll mean: 116.90876770019531 	 kl mean: 8.992227554321289 	 loss mean: 125.9010009765625
nll mean: 116.81499481201172 	 kl mean: 8.992227554321289 	 loss mean: 125.80721282958984
nll mean: 116.52244567871094 	 kl mean: 8.992227554321289 	 loss mean: 125.51466369628906


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 30%|███       | 3/10 [00:00<00:00, 10.28it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.28it/s][A

nll mean: 116.5335922241211 	 kl mean: 8.992227554321289 	 loss mean: 125.52581787109375
nll mean: 116.68235778808594 	 kl mean: 8.992227554321289 	 loss mean: 125.6745834350586
nll mean: 117.34611511230469 	 kl mean: 8.992227554321289 	 loss mean: 126.33833312988281


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.39it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.28it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.26it/s][A
                                               [A

nll mean: 116.71054077148438 	 kl mean: 8.992227554321289 	 loss mean: 125.70276641845703
nll mean: 117.10469055175781 	 kl mean: 8.992227554321289 	 loss mean: 126.09691619873047



 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.13it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.20it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]

nll mean: 116.66556549072266 	 kl mean: 8.992227554321289 	 loss mean: 125.65779113769531
nll mean: 117.20166015625 	 kl mean: 8.992227554321289 	 loss mean: 126.19387817382812
nll mean: 106.61844635009766 	 kl mean: 7.871135711669922 	 loss mean: 114.48957824707031
nll mean: 106.70830535888672 	 kl mean: 7.871135711669922 	 loss mean: 114.5794448852539
nll mean: 106.57536315917969 	 kl mean: 7.871135711669922 	 loss mean: 114.44650268554688



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
 80%|████████  | 8/10 [00:00<00:00, 33.02it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.80it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 106.56541442871094 	 kl mean: 7.871135711669922 	 loss mean: 114.43653869628906
nll mean: 106.52998352050781 	 kl mean: 7.871135711669922 	 loss mean: 114.401123046875
nll mean: 105.84693908691406 	 kl mean: 7.871135711669922 	 loss mean: 113.71807098388672
nll mean: 106.3298568725586 	 kl mean: 7.871135711669922 	 loss mean: 114.20098876953125
nll mean: 106.41925048828125 	 kl mean: 7.871135711669922 	 loss mean: 114.29039001464844
nll mean: 106.64276123046875 	 kl mean: 7.871135711669922 	 loss mean: 114.51390075683594
nll mean: 106.57242584228516 	 kl mean: 7.871135711669922 	 loss mean: 114.44355773925781


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.86it/s][A

nll mean: 159.56881713867188 	 kl mean: 8.631579399108887 	 loss mean: 168.2003936767578
nll mean: 158.51954650878906 	 kl mean: 8.631579399108887 	 loss mean: 167.151123046875
nll mean: 158.94882202148438 	 kl mean: 8.631579399108887 	 loss mean: 167.58041381835938


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.86it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.79it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A

nll mean: 158.97283935546875 	 kl mean: 8.631579399108887 	 loss mean: 167.6044158935547
nll mean: 158.5875244140625 	 kl mean: 8.631579399108887 	 loss mean: 167.2191162109375
nll mean: 159.17041015625 	 kl mean: 8.631579399108887 	 loss mean: 167.802001953125


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.74it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.75it/s][A

nll mean: 159.19296264648438 	 kl mean: 8.631579399108887 	 loss mean: 167.8245391845703
nll mean: 158.87123107910156 	 kl mean: 8.631579399108887 	 loss mean: 167.5028076171875
nll mean: 159.03831481933594 	 kl mean: 8.631579399108887 	 loss mean: 167.66989135742188


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.75it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.65it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.08it/s][A

nll mean: 158.9643096923828 	 kl mean: 8.631579399108887 	 loss mean: 167.59588623046875
nll mean: 120.48883819580078 	 kl mean: 9.645225524902344 	 loss mean: 130.13406372070312
nll mean: 120.45694732666016 	 kl mean: 9.645225524902344 	 loss mean: 130.1021728515625
nll mean: 121.190185546875 	 kl mean: 9.645225524902344 	 loss mean: 130.83541870117188
nll mean: 121.04145050048828 	 kl mean: 9.645225524902344 	 loss mean: 130.68667602539062


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.08it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.84it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.59it/s][A

nll mean: 120.24607849121094 	 kl mean: 9.645225524902344 	 loss mean: 129.89129638671875
nll mean: 121.41801452636719 	 kl mean: 9.645225524902344 	 loss mean: 131.063232421875
nll mean: 121.09371948242188 	 kl mean: 9.645225524902344 	 loss mean: 130.73895263671875
nll mean: 121.20454406738281 	 kl mean: 9.645225524902344 	 loss mean: 130.84976196289062
nll mean: 120.91641235351562 	 kl mean: 9.645225524902344 	 loss mean: 130.5616455078125


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.39it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.57it/s][A

nll mean: 121.07318115234375 	 kl mean: 9.645225524902344 	 loss mean: 130.71841430664062
nll mean: 113.80826568603516 	 kl mean: 8.684402465820312 	 loss mean: 122.49266052246094
nll mean: 113.08885955810547 	 kl mean: 8.684402465820312 	 loss mean: 121.77325439453125



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.64it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A

nll mean: 113.12992858886719 	 kl mean: 8.684402465820312 	 loss mean: 121.81433868408203
nll mean: 113.5777359008789 	 kl mean: 8.684402465820312 	 loss mean: 122.26214599609375
nll mean: 113.20059204101562 	 kl mean: 8.684402465820312 	 loss mean: 121.88499450683594



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.74it/s][A

nll mean: 113.64930725097656 	 kl mean: 8.684402465820312 	 loss mean: 122.33370971679688
nll mean: 113.48300170898438 	 kl mean: 8.684402465820312 	 loss mean: 122.16739654541016
nll mean: 113.61094665527344 	 kl mean: 8.684402465820312 	 loss mean: 122.29534912109375



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.72it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]

nll mean: 113.07300567626953 	 kl mean: 8.684402465820312 	 loss mean: 121.75740814208984
nll mean: 113.3916015625 	 kl mean: 8.684402465820312 	 loss mean: 122.07601928710938
nll mean: 81.5157699584961 	 kl mean: 8.070981979370117 	 loss mean: 89.58674621582031
nll mean: 82.00787353515625 	 kl mean: 8.070981979370117 	 loss mean: 90.078857421875



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 22.20it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.33it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 81.69039154052734 	 kl mean: 8.070981979370117 	 loss mean: 89.76138305664062
nll mean: 81.91302490234375 	 kl mean: 8.070981979370117 	 loss mean: 89.9840087890625
nll mean: 82.07723236083984 	 kl mean: 8.070981979370117 	 loss mean: 90.14822387695312
nll mean: 81.49783325195312 	 kl mean: 8.070981979370117 	 loss mean: 89.56880950927734
nll mean: 81.7490463256836 	 kl mean: 8.070981979370117 	 loss mean: 89.82003784179688



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.39it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 22.37it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 82.3133316040039 	 kl mean: 8.070981979370117 	 loss mean: 90.38430786132812
nll mean: 82.21379852294922 	 kl mean: 8.070981979370117 	 loss mean: 90.28477478027344
nll mean: 82.0564956665039 	 kl mean: 8.070981979370117 	 loss mean: 90.12747192382812
nll mean: 109.93301391601562 	 kl mean: 7.705066680908203 	 loss mean: 117.63807678222656
nll mean: 109.68540954589844 	 kl mean: 7.705066680908203 	 loss mean: 117.39047241210938


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:16<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.92it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.66it/s][A

nll mean: 109.34913635253906 	 kl mean: 7.705066680908203 	 loss mean: 117.05419921875
nll mean: 109.87724304199219 	 kl mean: 7.705066680908203 	 loss mean: 117.58230590820312
nll mean: 109.64987182617188 	 kl mean: 7.705066680908203 	 loss mean: 117.35493469238281
nll mean: 110.26322174072266 	 kl mean: 7.705066680908203 	 loss mean: 117.9682846069336
nll mean: 109.81692504882812 	 kl mean: 7.705066680908203 	 loss mean: 117.5219955444336


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.66it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.42it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]

nll mean: 109.91191864013672 	 kl mean: 7.705066680908203 	 loss mean: 117.61698913574219
nll mean: 110.29527282714844 	 kl mean: 7.705066680908203 	 loss mean: 118.00033569335938
nll mean: 109.91249084472656 	 kl mean: 7.705066680908203 	 loss mean: 117.6175537109375
nll mean: 120.8437728881836 	 kl mean: 8.64830207824707 	 loss mean: 129.4920654296875



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.64it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A

nll mean: 121.30842590332031 	 kl mean: 8.64830207824707 	 loss mean: 129.95672607421875
nll mean: 121.06752014160156 	 kl mean: 8.64830207824707 	 loss mean: 129.7158203125
nll mean: 121.5269775390625 	 kl mean: 8.64830207824707 	 loss mean: 130.17527770996094



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 121.22320556640625 	 kl mean: 8.64830207824707 	 loss mean: 129.87152099609375
nll mean: 120.80770874023438 	 kl mean: 8.64830207824707 	 loss mean: 129.4560089111328
nll mean: 121.37947845458984 	 kl mean: 8.64830207824707 	 loss mean: 130.0277862548828



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.36it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.37it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.45682525634766 	 kl mean: 8.64830207824707 	 loss mean: 129.10513305664062
nll mean: 121.38350677490234 	 kl mean: 8.64830207824707 	 loss mean: 130.03179931640625
nll mean: 121.25811767578125 	 kl mean: 8.64830207824707 	 loss mean: 129.90640258789062


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.27it/s][A

nll mean: 60.478546142578125 	 kl mean: 10.489347457885742 	 loss mean: 70.9678955078125
nll mean: 60.8944091796875 	 kl mean: 10.489347457885742 	 loss mean: 71.38375854492188
nll mean: 60.44683074951172 	 kl mean: 10.489347457885742 	 loss mean: 70.93617248535156


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.27it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 10.21it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.23it/s][A

nll mean: 60.89582443237305 	 kl mean: 10.489347457885742 	 loss mean: 71.38516998291016
nll mean: 60.40278625488281 	 kl mean: 10.489347457885742 	 loss mean: 70.89213562011719
nll mean: 60.436729431152344 	 kl mean: 10.489347457885742 	 loss mean: 70.92607879638672


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.23it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.21it/s][A

nll mean: 60.76656723022461 	 kl mean: 10.489347457885742 	 loss mean: 71.25591278076172
nll mean: 60.26856231689453 	 kl mean: 10.489347457885742 	 loss mean: 70.7579116821289
nll mean: 60.81037902832031 	 kl mean: 10.489347457885742 	 loss mean: 71.29972839355469


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.21it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.18it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.12it/s][A

nll mean: 61.21385192871094 	 kl mean: 10.489347457885742 	 loss mean: 71.70320129394531
nll mean: 104.10569763183594 	 kl mean: 9.336602210998535 	 loss mean: 113.44229888916016
nll mean: 103.5816650390625 	 kl mean: 9.336602210998535 	 loss mean: 112.91826629638672


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 13.12it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 12.95it/s][A

nll mean: 103.62155151367188 	 kl mean: 9.336602210998535 	 loss mean: 112.9581527709961
nll mean: 103.56193542480469 	 kl mean: 9.336602210998535 	 loss mean: 112.89854431152344
nll mean: 104.03529357910156 	 kl mean: 9.336602210998535 	 loss mean: 113.37190246582031


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 12.95it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.92it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.96it/s][A

nll mean: 103.99263763427734 	 kl mean: 9.336602210998535 	 loss mean: 113.32923126220703
nll mean: 103.74244689941406 	 kl mean: 9.336602210998535 	 loss mean: 113.07905578613281
nll mean: 103.96482849121094 	 kl mean: 9.336602210998535 	 loss mean: 113.30143737792969


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.96it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.89it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:19<00:05,  1.34it/s]

nll mean: 103.98585510253906 	 kl mean: 9.336602210998535 	 loss mean: 113.32245635986328
nll mean: 103.91162109375 	 kl mean: 9.336602210998535 	 loss mean: 113.24822235107422
nll mean: 137.07125854492188 	 kl mean: 9.631765365600586 	 loss mean: 146.70303344726562



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 20%|██        | 2/10 [00:00<00:00, 10.27it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
[A                                           

nll mean: 137.68185424804688 	 kl mean: 9.631765365600586 	 loss mean: 147.31362915039062
nll mean: 137.46310424804688 	 kl mean: 9.631765365600586 	 loss mean: 147.0948486328125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.17it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
                                               

nll mean: 137.61573791503906 	 kl mean: 9.631765365600586 	 loss mean: 147.24749755859375
nll mean: 137.65158081054688 	 kl mean: 9.631765365600586 	 loss mean: 147.28335571289062



 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.11it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.00it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
                                               
 70%|███████   | 7/10 [00:00<00:00, 10.00it/s]

nll mean: 137.54019165039062 	 kl mean: 9.631765365600586 	 loss mean: 147.1719512939453
nll mean: 137.60247802734375 	 kl mean: 9.631765365600586 	 loss mean: 147.23423767089844
nll mean: 136.7757568359375 	 kl mean: 9.631765365600586 	 loss mean: 146.4075164794922
nll mean: 137.56317138671875 	 kl mean: 9.631765365600586 	 loss mean: 147.19493103027344


 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s]
 90%|█████████ | 9/10 [00:00<00:00, 10.00it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.34it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.99it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.22it/s]
 30%|███       | 3/10 [00:00<00:00, 26.00it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               


nll mean: 137.64822387695312 	 kl mean: 9.631765365600586 	 loss mean: 147.2799835205078
nll mean: 63.04759979248047 	 kl mean: 8.793890953063965 	 loss mean: 71.84149169921875
nll mean: 62.20345687866211 	 kl mean: 8.793890953063965 	 loss mean: 70.99734497070312
nll mean: 62.564483642578125 	 kl mean: 8.793890953063965 	 loss mean: 71.3583755493164
nll mean: 63.050071716308594 	 kl mean: 8.793890953063965 	 loss mean: 71.84395599365234
nll mean: 63.52234649658203 	 kl mean: 8.793890953063965 	 loss mean: 72.31623840332031


 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.65it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.22it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.49it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.28it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 63.047481536865234 	 kl mean: 8.793890953063965 	 loss mean: 71.84136962890625
nll mean: 62.77493667602539 	 kl mean: 8.793890953063965 	 loss mean: 71.56883239746094
nll mean: 62.838348388671875 	 kl mean: 8.793890953063965 	 loss mean: 71.63224029541016
nll mean: 62.90205001831055 	 kl mean: 8.793890953063965 	 loss mean: 71.69593811035156
nll mean: 62.321067810058594 	 kl mean: 8.793890953063965 	 loss mean: 71.1149673461914



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s]
 30%|███       | 3/10 [00:00<00:00, 21.35it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A

nll mean: 119.00816345214844 	 kl mean: 8.316097259521484 	 loss mean: 127.32425689697266
nll mean: 118.15679931640625 	 kl mean: 8.316097259521484 	 loss mean: 126.472900390625
nll mean: 118.25955200195312 	 kl mean: 8.316097259521484 	 loss mean: 126.57565307617188
nll mean: 118.88302612304688 	 kl mean: 8.316097259521484 	 loss mean: 127.1991195678711
nll mean: 118.53280639648438 	 kl mean: 8.316097259521484 	 loss mean: 126.84889221191406



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.37it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.44it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.39it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.41it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.47959899902344 	 kl mean: 8.316097259521484 	 loss mean: 126.79570007324219
nll mean: 117.9205093383789 	 kl mean: 8.316097259521484 	 loss mean: 126.23660278320312
nll mean: 118.87196350097656 	 kl mean: 8.316097259521484 	 loss mean: 127.18804931640625
nll mean: 118.40635681152344 	 kl mean: 8.316097259521484 	 loss mean: 126.72245025634766
nll mean: 118.04801940917969 	 kl mean: 8.316097259521484 	 loss mean: 126.36410522460938


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.50it/s][A

nll mean: 118.69530487060547 	 kl mean: 9.328603744506836 	 loss mean: 128.02391052246094
nll mean: 118.44457244873047 	 kl mean: 9.328603744506836 	 loss mean: 127.77317810058594
nll mean: 118.27716064453125 	 kl mean: 9.328603744506836 	 loss mean: 127.60577392578125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.50it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 12.63it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.71it/s][A

nll mean: 118.88426971435547 	 kl mean: 9.328603744506836 	 loss mean: 128.21286010742188
nll mean: 118.91912078857422 	 kl mean: 9.328603744506836 	 loss mean: 128.2477264404297
nll mean: 118.40028381347656 	 kl mean: 9.328603744506836 	 loss mean: 127.72888946533203


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.71it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.62it/s][A

nll mean: 119.06394958496094 	 kl mean: 9.328603744506836 	 loss mean: 128.39254760742188
nll mean: 118.99317932128906 	 kl mean: 9.328603744506836 	 loss mean: 128.32177734375
nll mean: 118.49577331542969 	 kl mean: 9.328603744506836 	 loss mean: 127.8243637084961


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.62it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.62it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.67it/s][A

nll mean: 118.52397918701172 	 kl mean: 9.328603744506836 	 loss mean: 127.85257720947266
nll mean: 112.76419830322266 	 kl mean: 8.443595886230469 	 loss mean: 121.2077865600586
nll mean: 112.89015197753906 	 kl mean: 8.443595886230469 	 loss mean: 121.33375549316406



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.62it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.48it/s][A

nll mean: 112.25843811035156 	 kl mean: 8.443595886230469 	 loss mean: 120.7020263671875
nll mean: 112.14346313476562 	 kl mean: 8.443595886230469 	 loss mean: 120.58706665039062
nll mean: 112.42825317382812 	 kl mean: 8.443595886230469 	 loss mean: 120.8718490600586



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.64it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.68it/s][A

nll mean: 112.4801025390625 	 kl mean: 8.443595886230469 	 loss mean: 120.9237060546875
nll mean: 112.36453247070312 	 kl mean: 8.443595886230469 	 loss mean: 120.80813598632812
nll mean: 112.24446868896484 	 kl mean: 8.443595886230469 	 loss mean: 120.68806457519531



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.48it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.64it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]

nll mean: 112.38014221191406 	 kl mean: 8.443595886230469 	 loss mean: 120.82373046875
nll mean: 112.43062591552734 	 kl mean: 8.443595886230469 	 loss mean: 120.87421417236328
nll mean: 111.95120239257812 	 kl mean: 8.60604476928711 	 loss mean: 120.5572509765625
nll mean: 110.9323959350586 	 kl mean: 8.60604476928711 	 loss mean: 119.53843688964844



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 21.71it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.50it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A

nll mean: 111.0925521850586 	 kl mean: 8.60604476928711 	 loss mean: 119.69859313964844
nll mean: 112.27764892578125 	 kl mean: 8.60604476928711 	 loss mean: 120.8836898803711
nll mean: 111.12150573730469 	 kl mean: 8.60604476928711 	 loss mean: 119.72755432128906
nll mean: 110.8399429321289 	 kl mean: 8.60604476928711 	 loss mean: 119.44599151611328
nll mean: 111.79197692871094 	 kl mean: 8.60604476928711 	 loss mean: 120.39802551269531



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.32it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.42it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.57it/s][A
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:23<00:00,  1.49it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]

nll mean: 111.1057357788086 	 kl mean: 8.60604476928711 	 loss mean: 119.71177673339844
nll mean: 111.11714935302734 	 kl mean: 8.60604476928711 	 loss mean: 119.72319793701172
nll mean: 111.28250122070312 	 kl mean: 8.60604476928711 	 loss mean: 119.8885498046875
nll mean: 85.12789154052734 	 kl mean: 9.783478736877441 	 loss mean: 94.91136169433594
nll mean: 86.32608032226562 	 kl mean: 9.783478736877441 	 loss mean: 96.10955810546875
nll mean: 86.29782104492188 	 kl mean: 9.783478736877441 	 loss mean: 96.081298828125



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 30.50it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.59it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.49it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 30.58it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.57it/s]


nll mean: 85.478759765625 	 kl mean: 9.783478736877441 	 loss mean: 95.26225280761719
nll mean: 85.66352844238281 	 kl mean: 9.783478736877441 	 loss mean: 95.44700622558594
nll mean: 85.50823211669922 	 kl mean: 9.783478736877441 	 loss mean: 95.29171752929688
nll mean: 84.8447494506836 	 kl mean: 9.783478736877441 	 loss mean: 94.62821960449219
nll mean: 85.38327026367188 	 kl mean: 9.783478736877441 	 loss mean: 95.166748046875
nll mean: 85.6609115600586 	 kl mean: 9.783478736877441 	 loss mean: 95.44438934326172
nll mean: 84.82850646972656 	 kl mean: 9.783478736877441 	 loss mean: 94.61198425292969
Approximate NLL:
tensor(121.2213, device='cuda:0')
Approximate KL:
tensor(8.8820, device='cuda:0')
Testing took 0:00:25.242807


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .99it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .99it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .99it/s][A

nll mean: 110.04257202148438 	 kl mean: 9.663260459899902 	 loss mean: 119.7058334350586
nll mean: 110.21083068847656 	 kl mean: 9.663260459899902 	 loss mean: 119.87409210205078
nll mean: 109.63124084472656 	 kl mean: 9.663260459899902 	 loss mean: 119.29449462890625
nll mean: 110.09777069091797 	 kl mean: 9.663260459899902 	 loss mean: 119.76103210449219
nll mean: 110.02740478515625 	 kl mean: 9.663260459899902 	 loss mean: 119.690673828125



  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.99it/s][A
                                      .59it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .59it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .59it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.59it/s][A
                                      .04it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 24.65it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.04421997070312 	 kl mean: 9.663260459899902 	 loss mean: 119.70748138427734
nll mean: 109.90673828125 	 kl mean: 9.663260459899902 	 loss mean: 119.56999969482422
nll mean: 110.00283813476562 	 kl mean: 9.663260459899902 	 loss mean: 119.66609954833984
nll mean: 109.69254302978516 	 kl mean: 9.663260459899902 	 loss mean: 119.35580444335938
nll mean: 109.79600524902344 	 kl mean: 9.663260459899902 	 loss mean: 119.45927429199219


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 20%|██        | 2/10 [00:00<00:00, 13.47it/s][A

nll mean: 127.31707000732422 	 kl mean: 9.707560539245605 	 loss mean: 137.02462768554688
nll mean: 126.83366394042969 	 kl mean: 9.707560539245605 	 loss mean: 136.5412139892578
nll mean: 126.97555541992188 	 kl mean: 9.707560539245605 	 loss mean: 136.68312072753906


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 20%|██        | 2/10 [00:00<00:00, 13.47it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 40%|████      | 4/10 [00:00<00:00, 13.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.73it/s][A

nll mean: 127.17341613769531 	 kl mean: 9.707560539245605 	 loss mean: 136.8809814453125
nll mean: 127.2640151977539 	 kl mean: 9.707560539245605 	 loss mean: 136.9715576171875
nll mean: 126.97709655761719 	 kl mean: 9.707560539245605 	 loss mean: 136.68466186523438


                                              
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:15,  2.45it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.73it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:15,  2.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.75it/s][A

nll mean: 128.20553588867188 	 kl mean: 9.707560539245605 	 loss mean: 137.91310119628906
nll mean: 127.63165283203125 	 kl mean: 9.707560539245605 	 loss mean: 137.33920288085938
nll mean: 126.97059631347656 	 kl mean: 9.707560539245605 	 loss mean: 136.6781463623047


                                              
  3%|▎         | 1/38 [00:01<00:15,  2.45it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.75it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.83it/s][A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 24.37it/s][A

nll mean: 127.9188003540039 	 kl mean: 9.707560539245605 	 loss mean: 137.6263427734375
nll mean: 97.72916412353516 	 kl mean: 8.85894775390625 	 loss mean: 106.58811950683594
nll mean: 97.57283020019531 	 kl mean: 8.85894775390625 	 loss mean: 106.43177795410156
nll mean: 97.40377807617188 	 kl mean: 8.85894775390625 	 loss mean: 106.26272583007812
nll mean: 97.73249816894531 	 kl mean: 8.85894775390625 	 loss mean: 106.5914535522461


                                              
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
 30%|███       | 3/10 [00:00<00:00, 24.37it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.42it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.43it/s][A

nll mean: 97.7662124633789 	 kl mean: 8.85894775390625 	 loss mean: 106.62516021728516
nll mean: 97.55416107177734 	 kl mean: 8.85894775390625 	 loss mean: 106.4131088256836
nll mean: 97.29788208007812 	 kl mean: 8.85894775390625 	 loss mean: 106.15682983398438
nll mean: 97.81509399414062 	 kl mean: 8.85894775390625 	 loss mean: 106.67404174804688
nll mean: 97.50653076171875 	 kl mean: 8.85894775390625 	 loss mean: 106.36548614501953


                                              
  5%|▌         | 2/38 [00:01<00:18,  1.99it/s]
100%|██████████| 10/10 [00:00<00:00, 24.45it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.75it/s][A

nll mean: 96.77145385742188 	 kl mean: 8.85894775390625 	 loss mean: 105.63040924072266
nll mean: 139.08053588867188 	 kl mean: 9.109256744384766 	 loss mean: 148.18978881835938
nll mean: 139.45401000976562 	 kl mean: 9.109256744384766 	 loss mean: 148.56326293945312


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
 20%|██        | 2/10 [00:00<00:00, 10.75it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 40%|████      | 4/10 [00:00<00:00, 10.78it/s][A

nll mean: 139.29150390625 	 kl mean: 9.109256744384766 	 loss mean: 148.40077209472656
nll mean: 139.23175048828125 	 kl mean: 9.109256744384766 	 loss mean: 148.3410186767578
nll mean: 140.11703491210938 	 kl mean: 9.109256744384766 	 loss mean: 149.22628784179688


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 40%|████      | 4/10 [00:00<00:00, 10.78it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.76it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A

nll mean: 138.37083435058594 	 kl mean: 9.109256744384766 	 loss mean: 147.48007202148438
nll mean: 138.98672485351562 	 kl mean: 9.109256744384766 	 loss mean: 148.09597778320312
nll mean: 138.59286499023438 	 kl mean: 9.109256744384766 	 loss mean: 147.70211791992188


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.75it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 138.89688110351562 	 kl mean: 9.109256744384766 	 loss mean: 148.00613403320312
nll mean: 139.66610717773438 	 kl mean: 9.109256744384766 	 loss mean: 148.77537536621094
nll mean: 127.83260345458984 	 kl mean: 8.676379203796387 	 loss mean: 136.5089874267578


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 20%|██        | 2/10 [00:00<00:00, 14.35it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.21it/s][A

nll mean: 127.65303802490234 	 kl mean: 8.676379203796387 	 loss mean: 136.32940673828125
nll mean: 127.39410400390625 	 kl mean: 8.676379203796387 	 loss mean: 136.07049560546875
nll mean: 127.39370727539062 	 kl mean: 8.676379203796387 	 loss mean: 136.07008361816406


                                              
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 40%|████      | 4/10 [00:00<00:00, 14.21it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.19it/s][A

nll mean: 127.51350402832031 	 kl mean: 8.676379203796387 	 loss mean: 136.18988037109375
nll mean: 127.16056823730469 	 kl mean: 8.676379203796387 	 loss mean: 135.83694458007812
nll mean: 127.2364273071289 	 kl mean: 8.676379203796387 	 loss mean: 135.91281127929688


                                              
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.19it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.63it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.18it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.22it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 127.64456939697266 	 kl mean: 8.676379203796387 	 loss mean: 136.32095336914062
nll mean: 127.09693145751953 	 kl mean: 8.676379203796387 	 loss mean: 135.7733154296875
nll mean: 127.43158721923828 	 kl mean: 8.676379203796387 	 loss mean: 136.10797119140625


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.50it/s][A

nll mean: 122.89643859863281 	 kl mean: 8.74917984008789 	 loss mean: 131.64561462402344
nll mean: 122.73145294189453 	 kl mean: 8.74917984008789 	 loss mean: 131.48062133789062
nll mean: 123.44874572753906 	 kl mean: 8.74917984008789 	 loss mean: 132.1979217529297


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.50it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 14.26it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.28it/s][A

nll mean: 123.01017761230469 	 kl mean: 8.74917984008789 	 loss mean: 131.7593536376953
nll mean: 122.71975708007812 	 kl mean: 8.74917984008789 	 loss mean: 131.46893310546875
nll mean: 123.68753051757812 	 kl mean: 8.74917984008789 	 loss mean: 132.43670654296875


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.28it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.11it/s][A

nll mean: 122.67882537841797 	 kl mean: 8.74917984008789 	 loss mean: 131.42800903320312
nll mean: 122.71853637695312 	 kl mean: 8.74917984008789 	 loss mean: 131.46771240234375
nll mean: 123.66499328613281 	 kl mean: 8.74917984008789 	 loss mean: 132.4141845703125


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.11it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.12it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.48it/s][A

nll mean: 123.11724090576172 	 kl mean: 8.74917984008789 	 loss mean: 131.86642456054688
nll mean: 134.10931396484375 	 kl mean: 8.783447265625 	 loss mean: 142.89276123046875
nll mean: 135.21316528320312 	 kl mean: 8.783447265625 	 loss mean: 143.99659729003906
nll mean: 134.8575439453125 	 kl mean: 8.783447265625 	 loss mean: 143.64097595214844
nll mean: 135.0616455078125 	 kl mean: 8.783447265625 	 loss mean: 143.8450927734375


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.48it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.24it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.80it/s][A

nll mean: 134.71426391601562 	 kl mean: 8.783447265625 	 loss mean: 143.49769592285156
nll mean: 134.91574096679688 	 kl mean: 8.783447265625 	 loss mean: 143.69918823242188
nll mean: 135.16551208496094 	 kl mean: 8.783447265625 	 loss mean: 143.94895935058594
nll mean: 135.14443969726562 	 kl mean: 8.783447265625 	 loss mean: 143.92788696289062
nll mean: 134.9287109375 	 kl mean: 8.783447265625 	 loss mean: 143.712158203125


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 24.39it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00, 23.96it/s][A

nll mean: 135.62713623046875 	 kl mean: 8.783447265625 	 loss mean: 144.4105987548828
nll mean: 105.59517669677734 	 kl mean: 8.737151145935059 	 loss mean: 114.33232116699219
nll mean: 104.76031494140625 	 kl mean: 8.737151145935059 	 loss mean: 113.49746704101562
nll mean: 105.39830017089844 	 kl mean: 8.737151145935059 	 loss mean: 114.13545227050781
nll mean: 105.68689727783203 	 kl mean: 8.737151145935059 	 loss mean: 114.4240493774414


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00, 23.96it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.22it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.33it/s][A

nll mean: 105.27153015136719 	 kl mean: 8.737151145935059 	 loss mean: 114.00868225097656
nll mean: 104.879638671875 	 kl mean: 8.737151145935059 	 loss mean: 113.61679077148438
nll mean: 105.74407958984375 	 kl mean: 8.737151145935059 	 loss mean: 114.48123168945312
nll mean: 105.98649597167969 	 kl mean: 8.737151145935059 	 loss mean: 114.72364807128906
nll mean: 105.24341583251953 	 kl mean: 8.737151145935059 	 loss mean: 113.98056030273438


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
100%|██████████| 10/10 [00:00<00:00, 24.44it/s][A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.86it/s][A

nll mean: 105.26213073730469 	 kl mean: 8.737151145935059 	 loss mean: 113.999267578125
nll mean: 130.26231384277344 	 kl mean: 9.707099914550781 	 loss mean: 139.96942138671875
nll mean: 130.4928741455078 	 kl mean: 9.707099914550781 	 loss mean: 140.19998168945312


                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 14.86it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.95it/s][A
 60%|██████    | 6/10 [00:00<00:00, 15.00it/s][A

nll mean: 130.45806884765625 	 kl mean: 9.707099914550781 	 loss mean: 140.16517639160156
nll mean: 130.49234008789062 	 kl mean: 9.707099914550781 	 loss mean: 140.19944763183594
nll mean: 130.3030242919922 	 kl mean: 9.707099914550781 	 loss mean: 140.0101318359375
nll mean: 130.3982391357422 	 kl mean: 9.707099914550781 	 loss mean: 140.1053466796875


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 60%|██████    | 6/10 [00:00<00:00, 15.00it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 15.11it/s]

nll mean: 130.4583282470703 	 kl mean: 9.707099914550781 	 loss mean: 140.16542053222656
nll mean: 130.56143188476562 	 kl mean: 9.707099914550781 	 loss mean: 140.26853942871094
nll mean: 130.6595916748047 	 kl mean: 9.707099914550781 	 loss mean: 140.36668395996094
nll mean: 130.80593872070312 	 kl mean: 9.707099914550781 	 loss mean: 140.51303100585938


[A
100%|██████████| 10/10 [00:00<00:00, 14.99it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.66it/s][A

nll mean: 130.20263671875 	 kl mean: 9.353462219238281 	 loss mean: 139.55609130859375
nll mean: 130.39369201660156 	 kl mean: 9.353462219238281 	 loss mean: 139.7471466064453
nll mean: 130.140625 	 kl mean: 9.353462219238281 	 loss mean: 139.49407958984375
nll mean: 130.5834197998047 	 kl mean: 9.353462219238281 	 loss mean: 139.9368896484375
nll mean: 130.28598022460938 	 kl mean: 9.353462219238281 	 loss mean: 139.6394500732422


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 30%|███       | 3/10 [00:00<00:00, 21.66it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.50it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.74it/s]
100%|██████████| 10/10 [00:00<00:00, 21.35it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.23095703125 	 kl mean: 9.353462219238281 	 loss mean: 139.58441162109375
nll mean: 130.18667602539062 	 kl mean: 9.353462219238281 	 loss mean: 139.54013061523438
nll mean: 130.14254760742188 	 kl mean: 9.353462219238281 	 loss mean: 139.49603271484375
nll mean: 130.50537109375 	 kl mean: 9.353462219238281 	 loss mean: 139.85882568359375
nll mean: 129.65512084960938 	 kl mean: 9.353462219238281 	 loss mean: 139.00857543945312


                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.53it/s][A

nll mean: 120.99574279785156 	 kl mean: 9.549284934997559 	 loss mean: 130.54502868652344
nll mean: 120.37590789794922 	 kl mean: 9.549284934997559 	 loss mean: 129.92518615722656
nll mean: 120.38922119140625 	 kl mean: 9.549284934997559 	 loss mean: 129.93850708007812
nll mean: 120.28553009033203 	 kl mean: 9.549284934997559 	 loss mean: 129.83480834960938
nll mean: 119.81427001953125 	 kl mean: 9.549284934997559 	 loss mean: 129.36355590820312


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 30%|███       | 3/10 [00:00<00:00, 24.53it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.52it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.84it/s]
100%|██████████| 10/10 [00:00<00:00, 24.50it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.2159423828125 	 kl mean: 9.549284934997559 	 loss mean: 129.76522827148438
nll mean: 120.5390625 	 kl mean: 9.549284934997559 	 loss mean: 130.08834838867188
nll mean: 120.26042175292969 	 kl mean: 9.549284934997559 	 loss mean: 129.80970764160156
nll mean: 120.25056457519531 	 kl mean: 9.549284934997559 	 loss mean: 129.7998504638672
nll mean: 119.989013671875 	 kl mean: 9.549284934997559 	 loss mean: 129.53829956054688


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A

nll mean: 142.53079223632812 	 kl mean: 9.418910026550293 	 loss mean: 151.94970703125
nll mean: 142.26373291015625 	 kl mean: 9.418910026550293 	 loss mean: 151.68264770507812
nll mean: 142.49424743652344 	 kl mean: 9.418910026550293 	 loss mean: 151.9131622314453
nll mean: 142.82107543945312 	 kl mean: 9.418910026550293 	 loss mean: 152.239990234375
nll mean: 141.82887268066406 	 kl mean: 9.418910026550293 	 loss mean: 151.24777221679688


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.73it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.57it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
100%|██████████| 10/10 [00:00<00:00, 21.23it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 142.71697998046875 	 kl mean: 9.418910026550293 	 loss mean: 152.13589477539062
nll mean: 142.81008911132812 	 kl mean: 9.418910026550293 	 loss mean: 152.22900390625
nll mean: 142.8015899658203 	 kl mean: 9.418910026550293 	 loss mean: 152.2205047607422
nll mean: 142.77191162109375 	 kl mean: 9.418910026550293 	 loss mean: 152.19082641601562
nll mean: 142.42031860351562 	 kl mean: 9.418910026550293 	 loss mean: 151.8392333984375


                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 32%|███▏      | 12/38 [00:06<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A

nll mean: 120.66764831542969 	 kl mean: 9.443309783935547 	 loss mean: 130.1109619140625
nll mean: 121.49871826171875 	 kl mean: 9.443309783935547 	 loss mean: 130.94203186035156
nll mean: 121.58799743652344 	 kl mean: 9.443309783935547 	 loss mean: 131.03131103515625


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 20%|██        | 2/10 [00:00<00:00, 12.61it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 40%|████      | 4/10 [00:00<00:00, 12.67it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.60it/s][A

nll mean: 121.10094451904297 	 kl mean: 9.443309783935547 	 loss mean: 130.54425048828125
nll mean: 121.31626892089844 	 kl mean: 9.443309783935547 	 loss mean: 130.75958251953125
nll mean: 121.1903305053711 	 kl mean: 9.443309783935547 	 loss mean: 130.63363647460938


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.60it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 121.05461120605469 	 kl mean: 9.443309783935547 	 loss mean: 130.4979248046875
nll mean: 121.44340515136719 	 kl mean: 9.443309783935547 	 loss mean: 130.88671875
nll mean: 121.53959655761719 	 kl mean: 9.443309783935547 	 loss mean: 130.98291015625


                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.02it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.50it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:00,  9.77it/s][A

nll mean: 121.16400909423828 	 kl mean: 9.443309783935547 	 loss mean: 130.60731506347656
nll mean: 162.99012756347656 	 kl mean: 9.842243194580078 	 loss mean: 172.83236694335938


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 10%|█         | 1/10 [00:00<00:00,  9.77it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00,  9.77it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A

nll mean: 163.25955200195312 	 kl mean: 9.842243194580078 	 loss mean: 173.101806640625
nll mean: 163.2494354248047 	 kl mean: 9.842243194580078 	 loss mean: 173.0916748046875
nll mean: 164.09043884277344 	 kl mean: 9.842243194580078 	 loss mean: 173.93267822265625


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 40%|████      | 4/10 [00:00<00:00,  9.89it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.88it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.85it/s][A

nll mean: 163.5236358642578 	 kl mean: 9.842243194580078 	 loss mean: 173.36587524414062
nll mean: 163.88912963867188 	 kl mean: 9.842243194580078 	 loss mean: 173.73135375976562


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.85it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
                                               [A
                                              

nll mean: 163.5529327392578 	 kl mean: 9.842243194580078 	 loss mean: 173.39517211914062
nll mean: 164.14193725585938 	 kl mean: 9.842243194580078 	 loss mean: 173.9841766357422


 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s]
 80%|████████  | 8/10 [00:01<00:00,  9.89it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.92it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 163.63461303710938 	 kl mean: 9.842243194580078 	 loss mean: 173.47683715820312
nll mean: 163.79623413085938 	 kl mean: 9.842243194580078 	 loss mean: 173.6384735107422
nll mean: 136.63796997070312 	 kl mean: 8.622537612915039 	 loss mean: 145.260498046875


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.03it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.87it/s][A

nll mean: 136.86862182617188 	 kl mean: 8.622537612915039 	 loss mean: 145.49114990234375
nll mean: 137.3488006591797 	 kl mean: 8.622537612915039 	 loss mean: 145.97132873535156
nll mean: 136.77381896972656 	 kl mean: 8.622537612915039 	 loss mean: 145.39634704589844
nll mean: 136.5286865234375 	 kl mean: 8.622537612915039 	 loss mean: 145.15121459960938


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 40%|████      | 4/10 [00:00<00:00, 17.87it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.76it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.74it/s][A

nll mean: 136.57701110839844 	 kl mean: 8.622537612915039 	 loss mean: 145.19955444335938
nll mean: 137.4666748046875 	 kl mean: 8.622537612915039 	 loss mean: 146.08920288085938
nll mean: 136.97218322753906 	 kl mean: 8.622537612915039 	 loss mean: 145.5947265625
nll mean: 138.23410034179688 	 kl mean: 8.622537612915039 	 loss mean: 146.85662841796875


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.68it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.73it/s][A

nll mean: 136.7127227783203 	 kl mean: 8.622537612915039 	 loss mean: 145.33526611328125
nll mean: 144.080810546875 	 kl mean: 9.906476974487305 	 loss mean: 153.98727416992188
nll mean: 144.20956420898438 	 kl mean: 9.906476974487305 	 loss mean: 154.1160430908203


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.73it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.75it/s][A

nll mean: 144.6092529296875 	 kl mean: 9.906476974487305 	 loss mean: 154.51571655273438
nll mean: 144.65771484375 	 kl mean: 9.906476974487305 	 loss mean: 154.56417846679688
nll mean: 144.6168975830078 	 kl mean: 9.906476974487305 	 loss mean: 154.52337646484375


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 40%|████      | 4/10 [00:00<00:00, 10.75it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.74it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.66it/s][A

nll mean: 144.51473999023438 	 kl mean: 9.906476974487305 	 loss mean: 154.42120361328125
nll mean: 144.010009765625 	 kl mean: 9.906476974487305 	 loss mean: 153.91647338867188
nll mean: 143.96669006347656 	 kl mean: 9.906476974487305 	 loss mean: 153.8731689453125


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.64it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 145.08395385742188 	 kl mean: 9.906476974487305 	 loss mean: 154.99041748046875
nll mean: 144.632080078125 	 kl mean: 9.906476974487305 	 loss mean: 154.53854370117188
nll mean: 144.6106719970703 	 kl mean: 8.486129760742188 	 loss mean: 153.0968017578125
nll mean: 145.22756958007812 	 kl mean: 8.486129760742188 	 loss mean: 153.71368408203125


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.06it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.07it/s][A

nll mean: 145.71182250976562 	 kl mean: 8.486129760742188 	 loss mean: 154.19796752929688
nll mean: 145.66189575195312 	 kl mean: 8.486129760742188 	 loss mean: 154.14804077148438
nll mean: 144.1856689453125 	 kl mean: 8.486129760742188 	 loss mean: 152.67178344726562
nll mean: 145.14840698242188 	 kl mean: 8.486129760742188 	 loss mean: 153.63455200195312
nll mean: 144.8855438232422 	 kl mean: 8.486129760742188 	 loss mean: 153.37167358398438


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.07it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 24.31it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 144.67825317382812 	 kl mean: 8.486129760742188 	 loss mean: 153.16439819335938
nll mean: 145.04771423339844 	 kl mean: 8.486129760742188 	 loss mean: 153.53384399414062
nll mean: 144.94989013671875 	 kl mean: 8.486129760742188 	 loss mean: 153.43601989746094
nll mean: 133.75428771972656 	 kl mean: 9.285539627075195 	 loss mean: 143.0398406982422
nll mean: 133.72946166992188 	 kl mean: 9.285539627075195 	 loss mean: 143.0150146484375


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.99it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.90it/s][A

nll mean: 132.75357055664062 	 kl mean: 9.285539627075195 	 loss mean: 142.03912353515625
nll mean: 134.02749633789062 	 kl mean: 9.285539627075195 	 loss mean: 143.31304931640625
nll mean: 133.86727905273438 	 kl mean: 9.285539627075195 	 loss mean: 143.15283203125
nll mean: 132.86717224121094 	 kl mean: 9.285539627075195 	 loss mean: 142.1527099609375
nll mean: 133.88424682617188 	 kl mean: 9.285539627075195 	 loss mean: 143.1697998046875


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.90it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
100%|██████████| 10/10 [00:00<00:00, 24.68it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 133.864013671875 	 kl mean: 9.285539627075195 	 loss mean: 143.14955139160156
nll mean: 133.9927978515625 	 kl mean: 9.285539627075195 	 loss mean: 143.27835083007812
nll mean: 133.18963623046875 	 kl mean: 9.285539627075195 	 loss mean: 142.47515869140625
nll mean: 127.67005157470703 	 kl mean: 10.20283317565918 	 loss mean: 137.8728790283203


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.34it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.44it/s][A

nll mean: 127.27281188964844 	 kl mean: 10.20283317565918 	 loss mean: 137.47564697265625
nll mean: 127.70323181152344 	 kl mean: 10.20283317565918 	 loss mean: 137.90606689453125
nll mean: 127.74337005615234 	 kl mean: 10.20283317565918 	 loss mean: 137.94619750976562


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 40%|████      | 4/10 [00:00<00:00, 12.44it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A

nll mean: 127.6219711303711 	 kl mean: 10.20283317565918 	 loss mean: 137.82479858398438
nll mean: 127.69497680664062 	 kl mean: 10.20283317565918 	 loss mean: 137.89781188964844
nll mean: 128.2748260498047 	 kl mean: 10.20283317565918 	 loss mean: 138.47764587402344


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.53it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.50it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.16098022460938 	 kl mean: 10.20283317565918 	 loss mean: 138.36380004882812
nll mean: 128.29605102539062 	 kl mean: 10.20283317565918 	 loss mean: 138.49888610839844
nll mean: 127.83492279052734 	 kl mean: 10.20283317565918 	 loss mean: 138.0377655029297


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A

nll mean: 150.68814086914062 	 kl mean: 9.467016220092773 	 loss mean: 160.1551513671875
nll mean: 150.79156494140625 	 kl mean: 9.467016220092773 	 loss mean: 160.25857543945312
nll mean: 150.3992462158203 	 kl mean: 9.467016220092773 	 loss mean: 159.86627197265625


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 12.42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.38it/s][A

nll mean: 150.41893005371094 	 kl mean: 9.467016220092773 	 loss mean: 159.8859405517578
nll mean: 150.70187377929688 	 kl mean: 9.467016220092773 	 loss mean: 160.1688690185547
nll mean: 150.22894287109375 	 kl mean: 9.467016220092773 	 loss mean: 159.69595336914062


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.38it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A

nll mean: 149.76248168945312 	 kl mean: 9.467016220092773 	 loss mean: 159.2294921875
nll mean: 150.7060546875 	 kl mean: 9.467016220092773 	 loss mean: 160.17308044433594
nll mean: 150.89398193359375 	 kl mean: 9.467016220092773 	 loss mean: 160.36099243164062


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.41it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.38it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.74it/s][A

nll mean: 150.06146240234375 	 kl mean: 9.467016220092773 	 loss mean: 159.52847290039062
nll mean: 157.67201232910156 	 kl mean: 9.331666946411133 	 loss mean: 167.00369262695312
nll mean: 157.06454467773438 	 kl mean: 9.331666946411133 	 loss mean: 166.39620971679688


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.74it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.61it/s][A

nll mean: 157.34823608398438 	 kl mean: 9.331666946411133 	 loss mean: 166.6798858642578
nll mean: 157.47750854492188 	 kl mean: 9.331666946411133 	 loss mean: 166.80917358398438
nll mean: 157.60153198242188 	 kl mean: 9.331666946411133 	 loss mean: 166.93319702148438


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.61it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.44it/s][A

nll mean: 157.79693603515625 	 kl mean: 9.331666946411133 	 loss mean: 167.1285858154297
nll mean: 157.6202392578125 	 kl mean: 9.331666946411133 	 loss mean: 166.95191955566406
nll mean: 158.23597717285156 	 kl mean: 9.331666946411133 	 loss mean: 167.56764221191406


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.44it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.35it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 158.07009887695312 	 kl mean: 9.331666946411133 	 loss mean: 167.40176391601562
nll mean: 158.29098510742188 	 kl mean: 9.331666946411133 	 loss mean: 167.62265014648438
nll mean: 118.23612976074219 	 kl mean: 9.388838768005371 	 loss mean: 127.62495422363281


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 10.14it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.17it/s][A

nll mean: 117.46003723144531 	 kl mean: 9.388838768005371 	 loss mean: 126.84886932373047
nll mean: 118.22071075439453 	 kl mean: 9.388838768005371 	 loss mean: 127.60955810546875
nll mean: 117.85096740722656 	 kl mean: 9.388838768005371 	 loss mean: 127.23980712890625


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 10.17it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.20it/s][A

nll mean: 117.41478729248047 	 kl mean: 9.388838768005371 	 loss mean: 126.80362701416016
nll mean: 117.56046295166016 	 kl mean: 9.388838768005371 	 loss mean: 126.94930267333984
nll mean: 117.25909423828125 	 kl mean: 9.388838768005371 	 loss mean: 126.64793395996094


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.20it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.18it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.18it/s][A

nll mean: 118.12953186035156 	 kl mean: 9.388838768005371 	 loss mean: 127.51836395263672
nll mean: 117.42916107177734 	 kl mean: 9.388838768005371 	 loss mean: 126.81800079345703
nll mean: 117.95623016357422 	 kl mean: 9.388838768005371 	 loss mean: 127.3450698852539



 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.03it/s][A

nll mean: 107.88448333740234 	 kl mean: 7.991828441619873 	 loss mean: 115.87631225585938
nll mean: 107.49208068847656 	 kl mean: 7.991828441619873 	 loss mean: 115.4839096069336
nll mean: 107.66032409667969 	 kl mean: 7.991828441619873 	 loss mean: 115.65216064453125
nll mean: 106.70001983642578 	 kl mean: 7.991828441619873 	 loss mean: 114.69184875488281
nll mean: 107.38553619384766 	 kl mean: 7.991828441619873 	 loss mean: 115.37736511230469
nll mean: 107.28065490722656 	 kl mean: 7.991828441619873 	 loss mean: 115.27249145507812
nll mean: 108.14115905761719 	 kl mean: 7.991828441619873 	 loss mean: 116.13298797607422


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.03it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
100%|██████████| 10/10 [00:00<00:00, 32.85it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]

nll mean: 107.41201782226562 	 kl mean: 7.991828441619873 	 loss mean: 115.40383911132812
nll mean: 107.20153045654297 	 kl mean: 7.991828441619873 	 loss mean: 115.193359375
nll mean: 106.5323257446289 	 kl mean: 7.991828441619873 	 loss mean: 114.52415466308594
nll mean: 162.5951385498047 	 kl mean: 8.905972480773926 	 loss mean: 171.50111389160156
nll mean: 162.77337646484375 	 kl mean: 8.905972480773926 	 loss mean: 171.67935180664062



  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.69it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 14.64it/s][A

nll mean: 162.6573028564453 	 kl mean: 8.905972480773926 	 loss mean: 171.5632781982422
nll mean: 162.4249267578125 	 kl mean: 8.905972480773926 	 loss mean: 171.3308868408203
nll mean: 162.3544464111328 	 kl mean: 8.905972480773926 	 loss mean: 171.26040649414062


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 40%|████      | 4/10 [00:00<00:00, 14.64it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.69it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.77it/s][A

nll mean: 163.12086486816406 	 kl mean: 8.905972480773926 	 loss mean: 172.02684020996094
nll mean: 162.36785888671875 	 kl mean: 8.905972480773926 	 loss mean: 171.27383422851562
nll mean: 163.27886962890625 	 kl mean: 8.905972480773926 	 loss mean: 172.18484497070312


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.77it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.71it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 162.66571044921875 	 kl mean: 8.905972480773926 	 loss mean: 171.57168579101562
nll mean: 163.07809448242188 	 kl mean: 8.905972480773926 	 loss mean: 171.98406982421875
nll mean: 120.77395629882812 	 kl mean: 9.737552642822266 	 loss mean: 130.51150512695312
nll mean: 120.78065490722656 	 kl mean: 9.737552642822266 	 loss mean: 130.51821899414062


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.14it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.07it/s][A

nll mean: 121.53291320800781 	 kl mean: 9.737552642822266 	 loss mean: 131.2704620361328
nll mean: 121.36946868896484 	 kl mean: 9.737552642822266 	 loss mean: 131.1070098876953
nll mean: 121.3514404296875 	 kl mean: 9.737552642822266 	 loss mean: 131.0889892578125
nll mean: 121.77521514892578 	 kl mean: 9.737552642822266 	 loss mean: 131.5127716064453
nll mean: 121.03952026367188 	 kl mean: 9.737552642822266 	 loss mean: 130.77706909179688


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.07it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
100%|██████████| 10/10 [00:00<00:00, 21.05it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.87841033935547 	 kl mean: 9.737552642822266 	 loss mean: 130.615966796875
nll mean: 121.61595153808594 	 kl mean: 9.737552642822266 	 loss mean: 131.353515625
nll mean: 121.1261215209961 	 kl mean: 9.737552642822266 	 loss mean: 130.86367797851562
nll mean: 113.85139465332031 	 kl mean: 8.95240592956543 	 loss mean: 122.80380249023438


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.64it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.80it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A

nll mean: 113.891845703125 	 kl mean: 8.95240592956543 	 loss mean: 122.84424591064453
nll mean: 114.18716430664062 	 kl mean: 8.95240592956543 	 loss mean: 123.13957977294922
nll mean: 114.67450714111328 	 kl mean: 8.95240592956543 	 loss mean: 123.62691497802734


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
 40%|████      | 4/10 [00:00<00:00, 14.72it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.68it/s][A

nll mean: 114.16459655761719 	 kl mean: 8.95240592956543 	 loss mean: 123.11700439453125
nll mean: 113.66377258300781 	 kl mean: 8.95240592956543 	 loss mean: 122.6161880493164
nll mean: 114.74160766601562 	 kl mean: 8.95240592956543 	 loss mean: 123.69400787353516


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.68it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.64it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.71it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 114.25143432617188 	 kl mean: 8.95240592956543 	 loss mean: 123.20384979248047
nll mean: 114.45425415039062 	 kl mean: 8.95240592956543 	 loss mean: 123.40666198730469
nll mean: 113.8519287109375 	 kl mean: 8.95240592956543 	 loss mean: 122.80433654785156
nll mean: 83.18287658691406 	 kl mean: 7.879803657531738 	 loss mean: 91.06268310546875


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 22.98it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.74it/s][A

nll mean: 83.11091613769531 	 kl mean: 7.879803657531738 	 loss mean: 90.99072265625
nll mean: 82.65217590332031 	 kl mean: 7.879803657531738 	 loss mean: 90.531982421875
nll mean: 83.29987335205078 	 kl mean: 7.879803657531738 	 loss mean: 91.17967224121094
nll mean: 83.2857437133789 	 kl mean: 7.879803657531738 	 loss mean: 91.1655502319336
nll mean: 83.4755859375 	 kl mean: 7.879803657531738 	 loss mean: 91.35537719726562


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.74it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 22.22it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 82.83558654785156 	 kl mean: 7.879803657531738 	 loss mean: 90.71539306640625
nll mean: 82.89988708496094 	 kl mean: 7.879803657531738 	 loss mean: 90.77969360351562
nll mean: 82.94493103027344 	 kl mean: 7.879803657531738 	 loss mean: 90.82473754882812
nll mean: 83.5570297241211 	 kl mean: 7.879803657531738 	 loss mean: 91.43683624267578
nll mean: 109.74343872070312 	 kl mean: 8.123786926269531 	 loss mean: 117.86721801757812


                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.70it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.56it/s][A

nll mean: 110.15371704101562 	 kl mean: 8.123786926269531 	 loss mean: 118.27751159667969
nll mean: 110.23994445800781 	 kl mean: 8.123786926269531 	 loss mean: 118.36372375488281
nll mean: 109.85724639892578 	 kl mean: 8.123786926269531 	 loss mean: 117.98103332519531
nll mean: 109.86688232421875 	 kl mean: 8.123786926269531 	 loss mean: 117.99067687988281
nll mean: 110.4110107421875 	 kl mean: 8.123786926269531 	 loss mean: 118.53480529785156


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.56it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.50it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.86038208007812 	 kl mean: 8.123786926269531 	 loss mean: 117.98417663574219
nll mean: 109.81903076171875 	 kl mean: 8.123786926269531 	 loss mean: 117.94281768798828
nll mean: 110.24797821044922 	 kl mean: 8.123786926269531 	 loss mean: 118.37177276611328
nll mean: 109.49949645996094 	 kl mean: 8.123786926269531 	 loss mean: 117.62327575683594


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.35it/s][A

nll mean: 120.86250305175781 	 kl mean: 8.995282173156738 	 loss mean: 129.8577880859375
nll mean: 120.9697265625 	 kl mean: 8.995282173156738 	 loss mean: 129.9650115966797
nll mean: 121.32769012451172 	 kl mean: 8.995282173156738 	 loss mean: 130.32296752929688


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.35it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.45it/s][A

nll mean: 120.55231475830078 	 kl mean: 8.995282173156738 	 loss mean: 129.547607421875
nll mean: 121.03804016113281 	 kl mean: 8.995282173156738 	 loss mean: 130.0333251953125
nll mean: 120.86399841308594 	 kl mean: 8.995282173156738 	 loss mean: 129.85928344726562


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.45it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.48it/s][A

nll mean: 120.38226318359375 	 kl mean: 8.995282173156738 	 loss mean: 129.37754821777344
nll mean: 120.89723205566406 	 kl mean: 8.995282173156738 	 loss mean: 129.89251708984375
nll mean: 120.68190002441406 	 kl mean: 8.995282173156738 	 loss mean: 129.67718505859375


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.48it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.47it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.03126525878906 	 kl mean: 8.995282173156738 	 loss mean: 130.02655029296875
nll mean: 60.66228103637695 	 kl mean: 9.990961074829102 	 loss mean: 70.65324401855469


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.01it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.05it/s][A

nll mean: 60.95771026611328 	 kl mean: 9.990961074829102 	 loss mean: 70.94866943359375
nll mean: 61.49728012084961 	 kl mean: 9.990961074829102 	 loss mean: 71.48823547363281
nll mean: 60.575035095214844 	 kl mean: 9.990961074829102 	 loss mean: 70.56599426269531


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 40%|████      | 4/10 [00:00<00:00, 10.05it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
[A                                           

nll mean: 61.22233963012695 	 kl mean: 9.990961074829102 	 loss mean: 71.21330261230469
nll mean: 60.26074981689453 	 kl mean: 9.990961074829102 	 loss mean: 70.251708984375


 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.03it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.02it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]


nll mean: 60.342227935791016 	 kl mean: 9.990961074829102 	 loss mean: 70.33318328857422
nll mean: 61.211517333984375 	 kl mean: 9.990961074829102 	 loss mean: 71.20248413085938
nll mean: 61.25715637207031 	 kl mean: 9.990961074829102 	 loss mean: 71.24810791015625


                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.99it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.06it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 13.32it/s][A

nll mean: 60.26464080810547 	 kl mean: 9.990961074829102 	 loss mean: 70.25559997558594
nll mean: 104.25397491455078 	 kl mean: 9.53155517578125 	 loss mean: 113.78553009033203
nll mean: 105.04536437988281 	 kl mean: 9.53155517578125 	 loss mean: 114.57691955566406


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 13.32it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 13.02it/s][A

nll mean: 104.35531616210938 	 kl mean: 9.53155517578125 	 loss mean: 113.88688659667969
nll mean: 104.86366271972656 	 kl mean: 9.53155517578125 	 loss mean: 114.39521789550781
nll mean: 104.50390625 	 kl mean: 9.53155517578125 	 loss mean: 114.03546142578125


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 13.02it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.85it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A

nll mean: 104.45967864990234 	 kl mean: 9.53155517578125 	 loss mean: 113.9912338256836
nll mean: 104.41554260253906 	 kl mean: 9.53155517578125 	 loss mean: 113.94709777832031
nll mean: 104.40109252929688 	 kl mean: 9.53155517578125 	 loss mean: 113.93264770507812


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.59it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.34791564941406 	 kl mean: 9.53155517578125 	 loss mean: 113.87947082519531
nll mean: 104.94156646728516 	 kl mean: 9.53155517578125 	 loss mean: 114.4731216430664
nll mean: 138.45091247558594 	 kl mean: 9.861700057983398 	 loss mean: 148.3126220703125


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00, 10.04it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]

nll mean: 138.11544799804688 	 kl mean: 9.861700057983398 	 loss mean: 147.97714233398438
nll mean: 138.01206970214844 	 kl mean: 9.861700057983398 	 loss mean: 147.873779296875
nll mean: 138.21011352539062 	 kl mean: 9.861700057983398 	 loss mean: 148.07180786132812



                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 10.03it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.02it/s][A
 70%|███████   | 7/10 [00:00<00:00, 10.07it/s][A

nll mean: 137.7341766357422 	 kl mean: 9.861700057983398 	 loss mean: 147.59588623046875
nll mean: 137.64634704589844 	 kl mean: 9.861700057983398 	 loss mean: 147.50804138183594
nll mean: 137.76791381835938 	 kl mean: 9.861700057983398 	 loss mean: 147.62960815429688


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.07it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.05it/s][A


nll mean: 137.51133728027344 	 kl mean: 9.861700057983398 	 loss mean: 147.37303161621094
nll mean: 139.0425262451172 	 kl mean: 9.861700057983398 	 loss mean: 148.90423583984375
nll mean: 138.40777587890625 	 kl mean: 9.861700057983398 	 loss mean: 148.26947021484375


100%|██████████| 10/10 [00:00<00:00, 10.05it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.99it/s]

nll mean: 63.19398880004883 	 kl mean: 8.726312637329102 	 loss mean: 71.92030334472656
nll mean: 62.16017150878906 	 kl mean: 8.726312637329102 	 loss mean: 70.88648986816406
nll mean: 62.56786346435547 	 kl mean: 8.726312637329102 	 loss mean: 71.29417419433594
nll mean: 62.60143280029297 	 kl mean: 8.726312637329102 	 loss mean: 71.32774353027344
nll mean: 62.386207580566406 	 kl mean: 8.726312637329102 	 loss mean: 71.11251831054688
nll mean: 62.569610595703125 	 kl mean: 8.726312637329102 	 loss mean: 71.29591369628906


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.99it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
100%|██████████| 10/10 [00:00<00:00, 25.42it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 62.67937469482422 	 kl mean: 8.726312637329102 	 loss mean: 71.40568542480469
nll mean: 62.682891845703125 	 kl mean: 8.726312637329102 	 loss mean: 71.40919494628906
nll mean: 63.24190139770508 	 kl mean: 8.726312637329102 	 loss mean: 71.96821594238281
nll mean: 62.301513671875 	 kl mean: 8.726312637329102 	 loss mean: 71.02782440185547
nll mean: 119.33391571044922 	 kl mean: 8.391151428222656 	 loss mean: 127.72506713867188


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.62it/s][A

nll mean: 119.76087188720703 	 kl mean: 8.391151428222656 	 loss mean: 128.1520233154297
nll mean: 119.84834289550781 	 kl mean: 8.391151428222656 	 loss mean: 128.239501953125
nll mean: 119.65579986572266 	 kl mean: 8.391151428222656 	 loss mean: 128.0469512939453
nll mean: 119.98863983154297 	 kl mean: 8.391151428222656 	 loss mean: 128.37979125976562
nll mean: 119.3055191040039 	 kl mean: 8.391151428222656 	 loss mean: 127.69667053222656


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.62it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.50it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.33384704589844 	 kl mean: 8.391151428222656 	 loss mean: 127.7249984741211
nll mean: 119.51406860351562 	 kl mean: 8.391151428222656 	 loss mean: 127.90520477294922
nll mean: 120.18923950195312 	 kl mean: 8.391151428222656 	 loss mean: 128.58038330078125
nll mean: 119.32134246826172 	 kl mean: 8.391151428222656 	 loss mean: 127.71249389648438


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.19it/s][A

nll mean: 120.44976806640625 	 kl mean: 9.459478378295898 	 loss mean: 129.9092559814453
nll mean: 120.06207275390625 	 kl mean: 9.459478378295898 	 loss mean: 129.5215606689453
nll mean: 119.63998413085938 	 kl mean: 9.459478378295898 	 loss mean: 129.09945678710938


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 20%|██        | 2/10 [00:00<00:00, 12.19it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 40%|████      | 4/10 [00:00<00:00, 12.29it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.34it/s][A

nll mean: 119.99983978271484 	 kl mean: 9.459478378295898 	 loss mean: 129.45932006835938
nll mean: 119.59791564941406 	 kl mean: 9.459478378295898 	 loss mean: 129.05738830566406
nll mean: 119.08688354492188 	 kl mean: 9.459478378295898 	 loss mean: 128.54635620117188


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.34it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.28it/s][A

nll mean: 119.56372833251953 	 kl mean: 9.459478378295898 	 loss mean: 129.023193359375
nll mean: 119.85787963867188 	 kl mean: 9.459478378295898 	 loss mean: 129.31735229492188
nll mean: 120.23719787597656 	 kl mean: 9.459478378295898 	 loss mean: 129.69668579101562


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.59it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.28it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.32it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.55it/s][A

nll mean: 119.67568969726562 	 kl mean: 9.459478378295898 	 loss mean: 129.1351776123047
nll mean: 113.49253845214844 	 kl mean: 8.799881935119629 	 loss mean: 122.29241943359375
nll mean: 113.83200073242188 	 kl mean: 8.799881935119629 	 loss mean: 122.63188171386719


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.55it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.57it/s][A

nll mean: 113.33421325683594 	 kl mean: 8.799881935119629 	 loss mean: 122.13410186767578
nll mean: 113.48199462890625 	 kl mean: 8.799881935119629 	 loss mean: 122.28187561035156
nll mean: 113.05732727050781 	 kl mean: 8.799881935119629 	 loss mean: 121.85720825195312


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.57it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.59it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A

nll mean: 113.2718505859375 	 kl mean: 8.799881935119629 	 loss mean: 122.07173156738281
nll mean: 113.57098388671875 	 kl mean: 8.799881935119629 	 loss mean: 122.37086486816406
nll mean: 112.86353302001953 	 kl mean: 8.799881935119629 	 loss mean: 121.66341400146484


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.62it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 113.25103759765625 	 kl mean: 8.799881935119629 	 loss mean: 122.0509262084961
nll mean: 112.86309814453125 	 kl mean: 8.799881935119629 	 loss mean: 121.66297912597656
nll mean: 111.85684204101562 	 kl mean: 8.624626159667969 	 loss mean: 120.4814682006836
nll mean: 112.3251724243164 	 kl mean: 8.624626159667969 	 loss mean: 120.94979858398438


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.52it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.38it/s][A

nll mean: 111.20196533203125 	 kl mean: 8.624626159667969 	 loss mean: 119.82658386230469
nll mean: 111.49966430664062 	 kl mean: 8.624626159667969 	 loss mean: 120.12428283691406
nll mean: 112.28227996826172 	 kl mean: 8.624626159667969 	 loss mean: 120.90690612792969
nll mean: 111.57048034667969 	 kl mean: 8.624626159667969 	 loss mean: 120.19509887695312
nll mean: 112.06230926513672 	 kl mean: 8.624626159667969 	 loss mean: 120.68693542480469


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.38it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 20.96it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.57350158691406 	 kl mean: 8.624626159667969 	 loss mean: 121.1981201171875
nll mean: 112.34774017333984 	 kl mean: 8.624626159667969 	 loss mean: 120.97236633300781
nll mean: 112.10977935791016 	 kl mean: 8.624626159667969 	 loss mean: 120.73440551757812
nll mean: 84.59303283691406 	 kl mean: 9.724547386169434 	 loss mean: 94.31756591796875
nll mean: 85.59878540039062 	 kl mean: 9.724547386169434 	 loss mean: 95.32334899902344
nll mean: 85.4688949584961 	 kl mean: 9.724547386169434 	 loss mean: 95.19344329833984



                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 29.82it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 30.14it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 85.21656036376953 	 kl mean: 9.724547386169434 	 loss mean: 94.94110107421875
nll mean: 84.82884979248047 	 kl mean: 9.724547386169434 	 loss mean: 94.55340576171875
nll mean: 85.51634216308594 	 kl mean: 9.724547386169434 	 loss mean: 95.24087524414062
nll mean: 85.28791046142578 	 kl mean: 9.724547386169434 	 loss mean: 95.012451171875
nll mean: 85.0825424194336 	 kl mean: 9.724547386169434 	 loss mean: 94.80709075927734
nll mean: 85.6040267944336 	 kl mean: 9.724547386169434 	 loss mean: 95.32857513427734
nll mean: 85.3139419555664 	 kl mean: 9.724547386169434 	 loss mean: 95.03848266601562
Approximate NLL:
tensor(121.8890, device='cuda:0')
Approximate KL:
tensor(9.1538, device='cuda:0')
Testing took 0:00:25.386697


In [22]:
# Print the approximate NLL estimates held in wd_fb_nlls: a list of scalar tensors
# (presumably one per evaluated checkpoint, as returned by get_approx_nlls — confirm).
print(wd_fb_nlls)

[tensor(121.8104, device='cuda:0'), tensor(121.3209, device='cuda:0'), tensor(121.2213, device='cuda:0'), tensor(121.8890, device='cuda:0')]


# Word dropout & MDR

In [23]:
# Resolve one checkpoint path per run directory (results0..results3) for the
# 'word_dropout_066_mdr_10' experiment, then display the resulting list.
# NOTE(review): in the recorded output, results3 resolves to a *_4500.pt checkpoint
# while the other three runs resolve to *_6000.pt — get_model_filenames takes the
# first entry yielded by Path.iterdir(), so confirm this is the intended checkpoint.
saved_model_files = get_model_filenames('word_dropout_066_mdr_10')
saved_model_files

['results_final/results0/word_dropout_066_mdr_10/models/sentence_vae_MDR_10.0_6000.pt',
 'results_final/results1/word_dropout_066_mdr_10/models/sentence_vae_MDR_10.0_6000.pt',
 'results_final/results2/word_dropout_066_mdr_10/models/sentence_vae_MDR_10.0_6000.pt',
 'results_final/results3/word_dropout_066_mdr_10/models/sentence_vae_MDR_10.0_4500.pt']

In [24]:
# Run the approximate-NLL evaluation on every checkpoint in saved_model_files.
# get_approx_nlls returns two parallel lists (NLL estimates, KL estimates) with one
# entry per checkpoint, in the same order as saved_model_files.
wd_mdr_nlls, wd_mdr_kls = get_approx_nlls(saved_model_files)

  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .55it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .55it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.55it/s][A

nll mean: 108.20780944824219 	 kl mean: 10.019697189331055 	 loss mean: 118.22750854492188
nll mean: 108.4472427368164 	 kl mean: 10.019697189331055 	 loss mean: 118.46693420410156
nll mean: 108.1527328491211 	 kl mean: 10.019697189331055 	 loss mean: 118.17243957519531
nll mean: 108.21694946289062 	 kl mean: 10.019697189331055 	 loss mean: 118.23664855957031
nll mean: 108.85493469238281 	 kl mean: 10.019697189331055 	 loss mean: 118.8746337890625


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.55it/s][A
                                      .21it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .21it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .21it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.21it/s][A
                                      .93it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 24.69it/s][A
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.30522155761719 	 kl mean: 10.019697189331055 	 loss mean: 119.32492065429688
nll mean: 108.63134765625 	 kl mean: 10.019697189331055 	 loss mean: 118.65103912353516
nll mean: 107.45580291748047 	 kl mean: 10.019697189331055 	 loss mean: 117.47549438476562
nll mean: 108.70138549804688 	 kl mean: 10.019697189331055 	 loss mean: 118.7210922241211
nll mean: 107.72859954833984 	 kl mean: 10.019697189331055 	 loss mean: 117.74829864501953



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s]
 20%|██        | 2/10 [00:00<00:00, 14.64it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A

nll mean: 125.81468963623047 	 kl mean: 9.112685203552246 	 loss mean: 134.9273681640625
nll mean: 126.61222839355469 	 kl mean: 9.112685203552246 	 loss mean: 135.72491455078125
nll mean: 125.43644714355469 	 kl mean: 9.112685203552246 	 loss mean: 134.54913330078125



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.34it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.27it/s][A

nll mean: 125.83395385742188 	 kl mean: 9.112685203552246 	 loss mean: 134.94662475585938
nll mean: 125.80613708496094 	 kl mean: 9.112685203552246 	 loss mean: 134.9188232421875
nll mean: 125.48638916015625 	 kl mean: 9.112685203552246 	 loss mean: 134.5990753173828



                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:15,  2.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.26it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:15,  2.46it/s][A

nll mean: 126.06605529785156 	 kl mean: 9.112685203552246 	 loss mean: 135.17874145507812
nll mean: 125.8436508178711 	 kl mean: 9.112685203552246 	 loss mean: 134.95632934570312
nll mean: 125.9412841796875 	 kl mean: 9.112685203552246 	 loss mean: 135.053955078125



                                              
  3%|▎         | 1/38 [00:01<00:15,  2.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.11it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.61it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A

nll mean: 125.87368774414062 	 kl mean: 9.112685203552246 	 loss mean: 134.9863739013672
nll mean: 97.1436538696289 	 kl mean: 8.431262016296387 	 loss mean: 105.57490539550781
nll mean: 97.94739532470703 	 kl mean: 8.431262016296387 	 loss mean: 106.37865447998047
nll mean: 97.06139373779297 	 kl mean: 8.431262016296387 	 loss mean: 105.49266052246094
nll mean: 97.38990783691406 	 kl mean: 8.431262016296387 	 loss mean: 105.8211669921875



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.61it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.56it/s][A

nll mean: 97.44905090332031 	 kl mean: 8.431262016296387 	 loss mean: 105.88031005859375
nll mean: 96.88758850097656 	 kl mean: 8.431262016296387 	 loss mean: 105.31885528564453
nll mean: 98.00318908691406 	 kl mean: 8.431262016296387 	 loss mean: 106.43444061279297
nll mean: 97.15967559814453 	 kl mean: 8.431262016296387 	 loss mean: 105.5909423828125
nll mean: 97.20411682128906 	 kl mean: 8.431262016296387 	 loss mean: 105.6353759765625



                                              
100%|██████████| 10/10 [00:00<00:00, 24.53it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.76it/s][A

nll mean: 97.71649932861328 	 kl mean: 8.431262016296387 	 loss mean: 106.14776611328125
nll mean: 137.51715087890625 	 kl mean: 8.918163299560547 	 loss mean: 146.435302734375
nll mean: 138.1865234375 	 kl mean: 8.918163299560547 	 loss mean: 147.1046905517578



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.78it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A

nll mean: 138.07301330566406 	 kl mean: 8.918163299560547 	 loss mean: 146.99118041992188
nll mean: 137.63108825683594 	 kl mean: 8.918163299560547 	 loss mean: 146.5492401123047
nll mean: 137.76043701171875 	 kl mean: 8.918163299560547 	 loss mean: 146.67861938476562



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.75it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.74it/s][A

nll mean: 137.76536560058594 	 kl mean: 8.918163299560547 	 loss mean: 146.68353271484375
nll mean: 137.74990844726562 	 kl mean: 8.918163299560547 	 loss mean: 146.66806030273438
nll mean: 137.0753173828125 	 kl mean: 8.918163299560547 	 loss mean: 145.99346923828125



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.73it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.6015167236328 	 kl mean: 8.918163299560547 	 loss mean: 146.51968383789062
nll mean: 138.71340942382812 	 kl mean: 8.918163299560547 	 loss mean: 147.63157653808594
nll mean: 125.47826385498047 	 kl mean: 8.336587905883789 	 loss mean: 133.81484985351562


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.90it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.76it/s][A

nll mean: 125.50885009765625 	 kl mean: 8.336587905883789 	 loss mean: 133.84542846679688
nll mean: 125.857421875 	 kl mean: 8.336587905883789 	 loss mean: 134.19400024414062
nll mean: 126.12826538085938 	 kl mean: 8.336587905883789 	 loss mean: 134.46484375


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 40%|████      | 4/10 [00:00<00:00, 14.76it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.38it/s][A

nll mean: 125.47534942626953 	 kl mean: 8.336587905883789 	 loss mean: 133.81195068359375
nll mean: 125.99801635742188 	 kl mean: 8.336587905883789 	 loss mean: 134.3345947265625
nll mean: 125.48299407958984 	 kl mean: 8.336587905883789 	 loss mean: 133.819580078125


                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.38it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.22it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.14it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.21495819091797 	 kl mean: 8.336587905883789 	 loss mean: 133.55154418945312
nll mean: 125.10282897949219 	 kl mean: 8.336587905883789 	 loss mean: 133.4394073486328
nll mean: 126.0124282836914 	 kl mean: 8.336587905883789 	 loss mean: 134.34902954101562



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.31it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.71867370605469 	 kl mean: 8.594341278076172 	 loss mean: 132.31301879882812
nll mean: 123.80345916748047 	 kl mean: 8.594341278076172 	 loss mean: 132.39779663085938
nll mean: 123.62598419189453 	 kl mean: 8.594341278076172 	 loss mean: 132.22032165527344



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.20it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.15it/s][A

nll mean: 122.84735107421875 	 kl mean: 8.594341278076172 	 loss mean: 131.44168090820312
nll mean: 123.34654998779297 	 kl mean: 8.594341278076172 	 loss mean: 131.94088745117188
nll mean: 123.30516052246094 	 kl mean: 8.594341278076172 	 loss mean: 131.89950561523438



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.17it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.53384399414062 	 kl mean: 8.594341278076172 	 loss mean: 132.12818908691406
nll mean: 123.22415161132812 	 kl mean: 8.594341278076172 	 loss mean: 131.81849670410156
nll mean: 123.58486938476562 	 kl mean: 8.594341278076172 	 loss mean: 132.17921447753906



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.10it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.27it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 123.20835876464844 	 kl mean: 8.594341278076172 	 loss mean: 131.80270385742188
nll mean: 133.60548400878906 	 kl mean: 8.703181266784668 	 loss mean: 142.30865478515625
nll mean: 133.0620574951172 	 kl mean: 8.703181266784668 	 loss mean: 141.76522827148438
nll mean: 133.70855712890625 	 kl mean: 8.703181266784668 	 loss mean: 142.4117431640625
nll mean: 133.39573669433594 	 kl mean: 8.703181266784668 	 loss mean: 142.0989227294922



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.11it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.27it/s][A

nll mean: 133.82839965820312 	 kl mean: 8.703181266784668 	 loss mean: 142.53158569335938
nll mean: 133.65997314453125 	 kl mean: 8.703181266784668 	 loss mean: 142.3631591796875
nll mean: 133.31192016601562 	 kl mean: 8.703181266784668 	 loss mean: 142.01510620117188
nll mean: 133.0492401123047 	 kl mean: 8.703181266784668 	 loss mean: 141.75241088867188
nll mean: 133.42160034179688 	 kl mean: 8.703181266784668 	 loss mean: 142.12478637695312



                                              
100%|██████████| 10/10 [00:00<00:00, 23.86it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00, 24.68it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A

nll mean: 133.5074462890625 	 kl mean: 8.703181266784668 	 loss mean: 142.21063232421875
nll mean: 106.03096008300781 	 kl mean: 8.746149063110352 	 loss mean: 114.77710723876953
nll mean: 105.10198974609375 	 kl mean: 8.746149063110352 	 loss mean: 113.84813690185547
nll mean: 105.62004852294922 	 kl mean: 8.746149063110352 	 loss mean: 114.36619567871094
nll mean: 105.99861907958984 	 kl mean: 8.746149063110352 	 loss mean: 114.74476623535156



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.61it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.50it/s][A

nll mean: 105.83438110351562 	 kl mean: 8.746149063110352 	 loss mean: 114.58052825927734
nll mean: 105.38325500488281 	 kl mean: 8.746149063110352 	 loss mean: 114.12940979003906
nll mean: 105.64832305908203 	 kl mean: 8.746149063110352 	 loss mean: 114.39447021484375
nll mean: 105.14276123046875 	 kl mean: 8.746149063110352 	 loss mean: 113.88890838623047
nll mean: 105.540283203125 	 kl mean: 8.746149063110352 	 loss mean: 114.28643798828125



                                              
100%|██████████| 10/10 [00:00<00:00, 24.46it/s][A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.53it/s][A

nll mean: 105.13859558105469 	 kl mean: 8.746149063110352 	 loss mean: 113.8847427368164
nll mean: 130.13894653320312 	 kl mean: 9.525592803955078 	 loss mean: 139.66455078125
nll mean: 130.86354064941406 	 kl mean: 9.525592803955078 	 loss mean: 140.38914489746094


                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 14.53it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.35it/s][A

nll mean: 130.9485321044922 	 kl mean: 9.525592803955078 	 loss mean: 140.47412109375
nll mean: 130.62135314941406 	 kl mean: 9.525592803955078 	 loss mean: 140.14694213867188
nll mean: 131.0183868408203 	 kl mean: 9.525592803955078 	 loss mean: 140.54397583007812


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.35it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.55it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.89it/s][A

nll mean: 131.07913208007812 	 kl mean: 9.525592803955078 	 loss mean: 140.604736328125
nll mean: 131.04391479492188 	 kl mean: 9.525592803955078 	 loss mean: 140.5695037841797
nll mean: 130.5166778564453 	 kl mean: 9.525592803955078 	 loss mean: 140.04226684570312
nll mean: 130.8154296875 	 kl mean: 9.525592803955078 	 loss mean: 140.3410186767578


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.89it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.79it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.29it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A

nll mean: 130.89981079101562 	 kl mean: 9.525592803955078 	 loss mean: 140.42539978027344
nll mean: 129.55831909179688 	 kl mean: 9.363151550292969 	 loss mean: 138.92147827148438
nll mean: 129.1268310546875 	 kl mean: 9.363151550292969 	 loss mean: 138.489990234375
nll mean: 129.6611328125 	 kl mean: 9.363151550292969 	 loss mean: 139.0242919921875
nll mean: 129.19332885742188 	 kl mean: 9.363151550292969 	 loss mean: 138.55648803710938



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.22it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.24it/s][A

nll mean: 128.89105224609375 	 kl mean: 9.363151550292969 	 loss mean: 138.25421142578125
nll mean: 129.4889373779297 	 kl mean: 9.363151550292969 	 loss mean: 138.85208129882812
nll mean: 128.84320068359375 	 kl mean: 9.363151550292969 	 loss mean: 138.20635986328125
nll mean: 128.92623901367188 	 kl mean: 9.363151550292969 	 loss mean: 138.2893829345703
nll mean: 129.8215789794922 	 kl mean: 9.363151550292969 	 loss mean: 139.18472290039062



                                              
100%|██████████| 10/10 [00:00<00:00, 21.25it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.83it/s]
 30%|███       | 3/10 [00:00<00:00, 24.52it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A

nll mean: 129.11087036132812 	 kl mean: 9.363151550292969 	 loss mean: 138.47401428222656
nll mean: 118.5447998046875 	 kl mean: 9.372349739074707 	 loss mean: 127.91714477539062
nll mean: 118.36264038085938 	 kl mean: 9.372349739074707 	 loss mean: 127.7349853515625
nll mean: 118.23069763183594 	 kl mean: 9.372349739074707 	 loss mean: 127.60304260253906
nll mean: 118.37841796875 	 kl mean: 9.372349739074707 	 loss mean: 127.75076293945312



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.51it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.83it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.51it/s][A

nll mean: 118.95022583007812 	 kl mean: 9.372349739074707 	 loss mean: 128.3225860595703
nll mean: 118.02139282226562 	 kl mean: 9.372349739074707 	 loss mean: 127.39374542236328
nll mean: 118.00727844238281 	 kl mean: 9.372349739074707 	 loss mean: 127.37962341308594
nll mean: 117.98089599609375 	 kl mean: 9.372349739074707 	 loss mean: 127.35324096679688
nll mean: 117.39946746826172 	 kl mean: 9.372349739074707 	 loss mean: 126.77182006835938



                                               
100%|██████████| 10/10 [00:00<00:00, 24.48it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s]
 30%|███       | 3/10 [00:00<00:00, 21.21it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A

nll mean: 118.16496276855469 	 kl mean: 9.372349739074707 	 loss mean: 127.53730773925781
nll mean: 139.9605712890625 	 kl mean: 9.317708015441895 	 loss mean: 149.27828979492188
nll mean: 140.17872619628906 	 kl mean: 9.317708015441895 	 loss mean: 149.49642944335938
nll mean: 139.67373657226562 	 kl mean: 9.317708015441895 	 loss mean: 148.991455078125
nll mean: 140.10153198242188 	 kl mean: 9.317708015441895 	 loss mean: 149.41925048828125



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.34it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.98it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.27it/s][A

nll mean: 140.018798828125 	 kl mean: 9.317708015441895 	 loss mean: 149.33651733398438
nll mean: 139.6107177734375 	 kl mean: 9.317708015441895 	 loss mean: 148.9284210205078
nll mean: 139.79583740234375 	 kl mean: 9.317708015441895 	 loss mean: 149.113525390625
nll mean: 139.77520751953125 	 kl mean: 9.317708015441895 	 loss mean: 149.09292602539062
nll mean: 139.22508239746094 	 kl mean: 9.317708015441895 	 loss mean: 148.54278564453125



                                               
100%|██████████| 10/10 [00:00<00:00, 21.19it/s][A
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s]
 20%|██        | 2/10 [00:00<00:00, 12.60it/s][A

nll mean: 139.87696838378906 	 kl mean: 9.317708015441895 	 loss mean: 149.19468688964844
nll mean: 119.56687927246094 	 kl mean: 9.454336166381836 	 loss mean: 129.02120971679688
nll mean: 118.91106414794922 	 kl mean: 9.454336166381836 	 loss mean: 128.3654022216797



                                               
 32%|███▏      | 12/38 [00:06<00:12,  2.01it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A

nll mean: 119.75541687011719 	 kl mean: 9.454336166381836 	 loss mean: 129.20974731445312
nll mean: 119.77056121826172 	 kl mean: 9.454336166381836 	 loss mean: 129.22488403320312
nll mean: 119.47828674316406 	 kl mean: 9.454336166381836 	 loss mean: 128.9326171875



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.58it/s][A

nll mean: 119.20793151855469 	 kl mean: 9.454336166381836 	 loss mean: 128.6622772216797
nll mean: 119.96566772460938 	 kl mean: 9.454336166381836 	 loss mean: 129.41998291015625
nll mean: 119.75332641601562 	 kl mean: 9.454336166381836 	 loss mean: 129.20767211914062



                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:12,  2.01it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]

nll mean: 119.35951232910156 	 kl mean: 9.454336166381836 	 loss mean: 128.81385803222656
nll mean: 119.30900573730469 	 kl mean: 9.454336166381836 	 loss mean: 128.76333618164062
nll mean: 161.25509643554688 	 kl mean: 9.65589714050293 	 loss mean: 170.91099548339844



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s]
 20%|██        | 2/10 [00:00<00:00, 10.01it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A

nll mean: 161.67031860351562 	 kl mean: 9.65589714050293 	 loss mean: 171.32623291015625
nll mean: 160.96041870117188 	 kl mean: 9.65589714050293 	 loss mean: 170.61631774902344



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.70it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.90it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.88it/s][A

nll mean: 161.03292846679688 	 kl mean: 9.65589714050293 	 loss mean: 170.68882751464844
nll mean: 160.7555694580078 	 kl mean: 9.65589714050293 	 loss mean: 170.41148376464844



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.84it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.86it/s][A


nll mean: 160.819580078125 	 kl mean: 9.65589714050293 	 loss mean: 170.47549438476562
nll mean: 161.064697265625 	 kl mean: 9.65589714050293 	 loss mean: 170.7205810546875


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.85it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
[A                                           

nll mean: 160.98452758789062 	 kl mean: 9.65589714050293 	 loss mean: 170.64044189453125
nll mean: 160.73094177246094 	 kl mean: 9.65589714050293 	 loss mean: 170.38682556152344


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.70it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.87it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s]
 20%|██        | 2/10 [00:00<00:00, 18.33it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 161.1733856201172 	 kl mean: 9.65589714050293 	 loss mean: 170.82928466796875
nll mean: 135.46096801757812 	 kl mean: 8.687883377075195 	 loss mean: 144.1488494873047
nll mean: 134.866455078125 	 kl mean: 8.687883377075195 	 loss mean: 143.55435180664062
nll mean: 135.24700927734375 	 kl mean: 8.687883377075195 	 loss mean: 143.93487548828125



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.12it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.02it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.40it/s][A

nll mean: 135.2344970703125 	 kl mean: 8.687883377075195 	 loss mean: 143.92239379882812
nll mean: 134.80401611328125 	 kl mean: 8.687883377075195 	 loss mean: 143.49191284179688
nll mean: 135.94091796875 	 kl mean: 8.687883377075195 	 loss mean: 144.62879943847656
nll mean: 135.5600128173828 	 kl mean: 8.687883377075195 	 loss mean: 144.24790954589844



                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
 80%|████████  | 8/10 [00:00<00:00, 18.00it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.40it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.87it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 134.88238525390625 	 kl mean: 8.687883377075195 	 loss mean: 143.5702667236328
nll mean: 136.45079040527344 	 kl mean: 8.687883377075195 	 loss mean: 145.138671875
nll mean: 135.69012451171875 	 kl mean: 8.687883377075195 	 loss mean: 144.3780059814453



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.76it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A

nll mean: 143.44851684570312 	 kl mean: 9.467691421508789 	 loss mean: 152.91622924804688
nll mean: 142.92112731933594 	 kl mean: 9.467691421508789 	 loss mean: 152.38882446289062
nll mean: 142.59698486328125 	 kl mean: 9.467691421508789 	 loss mean: 152.06468200683594



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.81it/s][A

nll mean: 142.46864318847656 	 kl mean: 9.467691421508789 	 loss mean: 151.93634033203125
nll mean: 142.7498779296875 	 kl mean: 9.467691421508789 	 loss mean: 152.21755981445312
nll mean: 143.37498474121094 	 kl mean: 9.467691421508789 	 loss mean: 152.84266662597656



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.78it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A

nll mean: 142.46121215820312 	 kl mean: 9.467691421508789 	 loss mean: 151.9289093017578
nll mean: 142.86441040039062 	 kl mean: 9.467691421508789 	 loss mean: 152.3321075439453
nll mean: 143.4736328125 	 kl mean: 9.467691421508789 	 loss mean: 152.94131469726562



                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.74it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.73it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A

nll mean: 143.11244201660156 	 kl mean: 9.467691421508789 	 loss mean: 152.58013916015625
nll mean: 143.33865356445312 	 kl mean: 8.298538208007812 	 loss mean: 151.63717651367188
nll mean: 143.3238067626953 	 kl mean: 8.298538208007812 	 loss mean: 151.62234497070312
nll mean: 143.38583374023438 	 kl mean: 8.298538208007812 	 loss mean: 151.6843719482422
nll mean: 143.64132690429688 	 kl mean: 8.298538208007812 	 loss mean: 151.93984985351562



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.62it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.48it/s][A

nll mean: 143.71127319335938 	 kl mean: 8.298538208007812 	 loss mean: 152.00979614257812
nll mean: 143.70216369628906 	 kl mean: 8.298538208007812 	 loss mean: 152.00070190429688
nll mean: 143.0716094970703 	 kl mean: 8.298538208007812 	 loss mean: 151.37014770507812
nll mean: 143.01577758789062 	 kl mean: 8.298538208007812 	 loss mean: 151.31430053710938
nll mean: 143.7925567626953 	 kl mean: 8.298538208007812 	 loss mean: 152.09109497070312



                                               
100%|██████████| 10/10 [00:00<00:00, 24.36it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.63it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A

nll mean: 143.8207244873047 	 kl mean: 8.298538208007812 	 loss mean: 152.1192626953125
nll mean: 133.02801513671875 	 kl mean: 8.868478775024414 	 loss mean: 141.89651489257812
nll mean: 133.31024169921875 	 kl mean: 8.868478775024414 	 loss mean: 142.1787109375
nll mean: 132.60714721679688 	 kl mean: 8.868478775024414 	 loss mean: 141.47561645507812
nll mean: 133.02798461914062 	 kl mean: 8.868478775024414 	 loss mean: 141.89645385742188



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.58it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.46it/s][A

nll mean: 132.7359619140625 	 kl mean: 8.868478775024414 	 loss mean: 141.60443115234375
nll mean: 133.10018920898438 	 kl mean: 8.868478775024414 	 loss mean: 141.96865844726562
nll mean: 133.3192901611328 	 kl mean: 8.868478775024414 	 loss mean: 142.18777465820312
nll mean: 133.36337280273438 	 kl mean: 8.868478775024414 	 loss mean: 142.23184204101562
nll mean: 132.9185791015625 	 kl mean: 8.868478775024414 	 loss mean: 141.78707885742188



                                               
100%|██████████| 10/10 [00:00<00:00, 24.43it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A

nll mean: 134.00636291503906 	 kl mean: 8.868478775024414 	 loss mean: 142.8748321533203
nll mean: 128.089111328125 	 kl mean: 9.578315734863281 	 loss mean: 137.6674346923828
nll mean: 127.89994812011719 	 kl mean: 9.578315734863281 	 loss mean: 137.478271484375



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.45it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A

nll mean: 127.93446350097656 	 kl mean: 9.578315734863281 	 loss mean: 137.51278686523438
nll mean: 127.84150695800781 	 kl mean: 9.578315734863281 	 loss mean: 137.41983032226562
nll mean: 127.70337677001953 	 kl mean: 9.578315734863281 	 loss mean: 137.2816925048828



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.46it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A

nll mean: 128.74066162109375 	 kl mean: 9.578315734863281 	 loss mean: 138.3189697265625
nll mean: 128.0910186767578 	 kl mean: 9.578315734863281 	 loss mean: 137.66932678222656
nll mean: 128.57362365722656 	 kl mean: 9.578315734863281 	 loss mean: 138.1519317626953



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.53it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]

nll mean: 127.78154754638672 	 kl mean: 9.578315734863281 	 loss mean: 137.35986328125
nll mean: 127.82727813720703 	 kl mean: 9.578315734863281 	 loss mean: 137.40557861328125
nll mean: 148.9134521484375 	 kl mean: 9.304128646850586 	 loss mean: 158.21759033203125



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.74it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.75it/s][A

nll mean: 147.98406982421875 	 kl mean: 9.304128646850586 	 loss mean: 157.2882080078125
nll mean: 147.57275390625 	 kl mean: 9.304128646850586 	 loss mean: 156.8768768310547
nll mean: 148.3994140625 	 kl mean: 9.304128646850586 	 loss mean: 157.70355224609375



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.64it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A

nll mean: 147.90081787109375 	 kl mean: 9.304128646850586 	 loss mean: 157.2049560546875
nll mean: 148.22828674316406 	 kl mean: 9.304128646850586 	 loss mean: 157.53240966796875
nll mean: 147.69969177246094 	 kl mean: 9.304128646850586 	 loss mean: 157.00381469726562



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.59it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.51it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 147.90081787109375 	 kl mean: 9.304128646850586 	 loss mean: 157.20494079589844
nll mean: 148.02328491210938 	 kl mean: 9.304128646850586 	 loss mean: 157.327392578125
nll mean: 148.22300720214844 	 kl mean: 9.304128646850586 	 loss mean: 157.5271453857422



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s]
 20%|██        | 2/10 [00:00<00:00, 12.66it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A

nll mean: 157.142822265625 	 kl mean: 8.724832534790039 	 loss mean: 165.86764526367188
nll mean: 156.9698486328125 	 kl mean: 8.724832534790039 	 loss mean: 165.69468688964844
nll mean: 157.0855712890625 	 kl mean: 8.724832534790039 	 loss mean: 165.81040954589844



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.62it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.45it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.56it/s][A

nll mean: 156.68385314941406 	 kl mean: 8.724832534790039 	 loss mean: 165.40869140625
nll mean: 157.57095336914062 	 kl mean: 8.724832534790039 	 loss mean: 166.29580688476562
nll mean: 156.72853088378906 	 kl mean: 8.724832534790039 	 loss mean: 165.45335388183594



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.49it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A

nll mean: 157.27548217773438 	 kl mean: 8.724832534790039 	 loss mean: 166.00030517578125
nll mean: 156.52261352539062 	 kl mean: 8.724832534790039 	 loss mean: 165.2474365234375
nll mean: 157.4268798828125 	 kl mean: 8.724832534790039 	 loss mean: 166.15171813964844



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.45it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
[A                                   

nll mean: 156.3701171875 	 kl mean: 8.724832534790039 	 loss mean: 165.09495544433594
nll mean: 117.01564025878906 	 kl mean: 9.16896915435791 	 loss mean: 126.18460845947266


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.12it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A


nll mean: 116.96843719482422 	 kl mean: 9.16896915435791 	 loss mean: 126.13740539550781
nll mean: 117.29638671875 	 kl mean: 9.16896915435791 	 loss mean: 126.46534729003906
nll mean: 116.96569061279297 	 kl mean: 9.16896915435791 	 loss mean: 126.13465881347656


 40%|████      | 4/10 [00:00<00:00, 10.12it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.15it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s][A

nll mean: 116.8714370727539 	 kl mean: 9.16896915435791 	 loss mean: 126.04041290283203
nll mean: 116.64930725097656 	 kl mean: 9.16896915435791 	 loss mean: 125.81827545166016
nll mean: 116.55072021484375 	 kl mean: 9.16896915435791 	 loss mean: 125.71968841552734



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.17it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.18it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.230712890625 	 kl mean: 9.16896915435791 	 loss mean: 125.39967346191406
nll mean: 117.12423706054688 	 kl mean: 9.16896915435791 	 loss mean: 126.293212890625
nll mean: 116.11204528808594 	 kl mean: 9.16896915435791 	 loss mean: 125.28101348876953



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.06it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A

nll mean: 106.99803924560547 	 kl mean: 7.697331428527832 	 loss mean: 114.69537353515625
nll mean: 106.7606201171875 	 kl mean: 7.697331428527832 	 loss mean: 114.45794677734375
nll mean: 107.0318603515625 	 kl mean: 7.697331428527832 	 loss mean: 114.72918701171875
nll mean: 106.38174438476562 	 kl mean: 7.697331428527832 	 loss mean: 114.0790786743164
nll mean: 106.46156311035156 	 kl mean: 7.697331428527832 	 loss mean: 114.15888977050781
nll mean: 107.21318817138672 	 kl mean: 7.697331428527832 	 loss mean: 114.9105224609375
nll mean: 106.82814025878906 	 kl mean: 7.697331428527832 	 loss mean: 114.52546691894531



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
 80%|████████  | 8/10 [00:00<00:00, 32.96it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.80it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               

nll mean: 106.79890441894531 	 kl mean: 7.697331428527832 	 loss mean: 114.49623107910156
nll mean: 107.26133728027344 	 kl mean: 7.697331428527832 	 loss mean: 114.95867919921875
nll mean: 107.41423034667969 	 kl mean: 7.697331428527832 	 loss mean: 115.11156463623047
nll mean: 158.88827514648438 	 kl mean: 8.705812454223633 	 loss mean: 167.59408569335938



 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.60it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.62it/s][A

nll mean: 159.12811279296875 	 kl mean: 8.705812454223633 	 loss mean: 167.83392333984375
nll mean: 159.50228881835938 	 kl mean: 8.705812454223633 	 loss mean: 168.20809936523438
nll mean: 158.723876953125 	 kl mean: 8.705812454223633 	 loss mean: 167.4296875



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.62it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A

nll mean: 158.57398986816406 	 kl mean: 8.705812454223633 	 loss mean: 167.27981567382812
nll mean: 158.70416259765625 	 kl mean: 8.705812454223633 	 loss mean: 167.4099884033203
nll mean: 158.7672882080078 	 kl mean: 8.705812454223633 	 loss mean: 167.4730987548828



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.63it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.62it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 158.8874969482422 	 kl mean: 8.705812454223633 	 loss mean: 167.5933074951172
nll mean: 159.18887329101562 	 kl mean: 8.705812454223633 	 loss mean: 167.8946990966797
nll mean: 158.63864135742188 	 kl mean: 8.705812454223633 	 loss mean: 167.34445190429688
nll mean: 120.4775161743164 	 kl mean: 9.71940803527832 	 loss mean: 130.19692993164062


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.90it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.72it/s][A

nll mean: 120.43840789794922 	 kl mean: 9.71940803527832 	 loss mean: 130.15782165527344
nll mean: 120.11084747314453 	 kl mean: 9.71940803527832 	 loss mean: 129.8302459716797
nll mean: 120.12781524658203 	 kl mean: 9.71940803527832 	 loss mean: 129.84722900390625
nll mean: 120.06509399414062 	 kl mean: 9.71940803527832 	 loss mean: 129.78448486328125
nll mean: 120.29450988769531 	 kl mean: 9.71940803527832 	 loss mean: 130.013916015625


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.72it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.31it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.33636474609375 	 kl mean: 9.71940803527832 	 loss mean: 130.0557861328125
nll mean: 120.42897033691406 	 kl mean: 9.71940803527832 	 loss mean: 130.14837646484375
nll mean: 120.52241516113281 	 kl mean: 9.71940803527832 	 loss mean: 130.2418212890625
nll mean: 120.32958984375 	 kl mean: 9.71940803527832 	 loss mean: 130.04901123046875


                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.75it/s][A

nll mean: 114.07025909423828 	 kl mean: 8.816764831542969 	 loss mean: 122.88702392578125
nll mean: 114.3563461303711 	 kl mean: 8.816764831542969 	 loss mean: 123.17311096191406
nll mean: 114.3008041381836 	 kl mean: 8.816764831542969 	 loss mean: 123.11756896972656


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.75it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.76it/s][A

nll mean: 114.6611557006836 	 kl mean: 8.816764831542969 	 loss mean: 123.47792053222656
nll mean: 114.83625030517578 	 kl mean: 8.816764831542969 	 loss mean: 123.65300750732422
nll mean: 114.67927551269531 	 kl mean: 8.816764831542969 	 loss mean: 123.49604797363281


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.76it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.73it/s][A

nll mean: 113.72028350830078 	 kl mean: 8.816764831542969 	 loss mean: 122.53704071044922
nll mean: 114.07189178466797 	 kl mean: 8.816764831542969 	 loss mean: 122.88865661621094
nll mean: 113.91840362548828 	 kl mean: 8.816764831542969 	 loss mean: 122.73516082763672


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.66it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.76it/s][A

nll mean: 114.23617553710938 	 kl mean: 8.816764831542969 	 loss mean: 123.05293273925781
nll mean: 81.85470581054688 	 kl mean: 8.117929458618164 	 loss mean: 89.97264099121094
nll mean: 81.34175872802734 	 kl mean: 8.117929458618164 	 loss mean: 89.45968627929688
nll mean: 82.3480224609375 	 kl mean: 8.117929458618164 	 loss mean: 90.4659423828125
nll mean: 81.76114654541016 	 kl mean: 8.117929458618164 	 loss mean: 89.87907409667969


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.76it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.77it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 22.07it/s][A

nll mean: 81.75642395019531 	 kl mean: 8.117929458618164 	 loss mean: 89.87435150146484
nll mean: 81.73377227783203 	 kl mean: 8.117929458618164 	 loss mean: 89.85169982910156
nll mean: 81.74930572509766 	 kl mean: 8.117929458618164 	 loss mean: 89.86723327636719
nll mean: 81.72856140136719 	 kl mean: 8.117929458618164 	 loss mean: 89.84648895263672
nll mean: 81.71794128417969 	 kl mean: 8.117929458618164 	 loss mean: 89.83587646484375


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 21.90it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.69it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A

nll mean: 81.97959899902344 	 kl mean: 8.117929458618164 	 loss mean: 90.09752655029297
nll mean: 109.48933410644531 	 kl mean: 7.865001201629639 	 loss mean: 117.35433197021484
nll mean: 109.822265625 	 kl mean: 7.865001201629639 	 loss mean: 117.68727111816406
nll mean: 109.7327880859375 	 kl mean: 7.865001201629639 	 loss mean: 117.59779357910156
nll mean: 110.2516860961914 	 kl mean: 7.865001201629639 	 loss mean: 118.11669921875



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.53it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.54it/s][A

nll mean: 110.29034423828125 	 kl mean: 7.865001201629639 	 loss mean: 118.15534210205078
nll mean: 109.66703033447266 	 kl mean: 7.865001201629639 	 loss mean: 117.53202819824219
nll mean: 109.51460266113281 	 kl mean: 7.865001201629639 	 loss mean: 117.37960052490234
nll mean: 110.15409851074219 	 kl mean: 7.865001201629639 	 loss mean: 118.01910400390625
nll mean: 110.08711242675781 	 kl mean: 7.865001201629639 	 loss mean: 117.95211791992188



                                               
100%|██████████| 10/10 [00:00<00:00, 21.54it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.33it/s][A

nll mean: 109.55096435546875 	 kl mean: 7.865001201629639 	 loss mean: 117.41596221923828
nll mean: 121.29486083984375 	 kl mean: 9.01449966430664 	 loss mean: 130.30935668945312
nll mean: 121.11323547363281 	 kl mean: 9.01449966430664 	 loss mean: 130.1277313232422



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.46it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A

nll mean: 120.89341735839844 	 kl mean: 9.01449966430664 	 loss mean: 129.90792846679688
nll mean: 121.04874420166016 	 kl mean: 9.01449966430664 	 loss mean: 130.063232421875
nll mean: 121.30699157714844 	 kl mean: 9.01449966430664 	 loss mean: 130.32147216796875



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.51it/s][A

nll mean: 121.28927612304688 	 kl mean: 9.01449966430664 	 loss mean: 130.30377197265625
nll mean: 120.93144226074219 	 kl mean: 9.01449966430664 	 loss mean: 129.94593811035156
nll mean: 120.4970703125 	 kl mean: 9.01449966430664 	 loss mean: 129.51156616210938



                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.55it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]

nll mean: 120.79681396484375 	 kl mean: 9.01449966430664 	 loss mean: 129.81130981445312
nll mean: 120.9797592163086 	 kl mean: 9.01449966430664 	 loss mean: 129.9942626953125
nll mean: 60.83161926269531 	 kl mean: 9.730745315551758 	 loss mean: 70.56236267089844



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00,  9.88it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.98it/s][A

nll mean: 60.919918060302734 	 kl mean: 9.730745315551758 	 loss mean: 70.65066528320312
nll mean: 61.00164031982422 	 kl mean: 9.730745315551758 	 loss mean: 70.73238372802734
nll mean: 61.2509765625 	 kl mean: 9.730745315551758 	 loss mean: 70.98171997070312



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.94it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.88it/s][A

nll mean: 60.91374206542969 	 kl mean: 9.730745315551758 	 loss mean: 70.64448547363281
nll mean: 60.80440902709961 	 kl mean: 9.730745315551758 	 loss mean: 70.53515625



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.89it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.93it/s][A
                                               

nll mean: 61.059165954589844 	 kl mean: 9.730745315551758 	 loss mean: 70.78990173339844
nll mean: 60.18819808959961 	 kl mean: 9.730745315551758 	 loss mean: 69.9189453125



 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.93it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.94it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]

nll mean: 60.86172103881836 	 kl mean: 9.730745315551758 	 loss mean: 70.59246826171875
nll mean: 61.77140426635742 	 kl mean: 9.730745315551758 	 loss mean: 71.50215148925781
nll mean: 104.1751708984375 	 kl mean: 9.257952690124512 	 loss mean: 113.43312072753906



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 13.10it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.04it/s][A

nll mean: 104.91178131103516 	 kl mean: 9.257952690124512 	 loss mean: 114.16972351074219
nll mean: 103.72307586669922 	 kl mean: 9.257952690124512 	 loss mean: 112.98102569580078
nll mean: 103.84337615966797 	 kl mean: 9.257952690124512 	 loss mean: 113.10133361816406



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.90it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A

nll mean: 103.74839782714844 	 kl mean: 9.257952690124512 	 loss mean: 113.00635528564453
nll mean: 104.26766967773438 	 kl mean: 9.257952690124512 	 loss mean: 113.52561950683594
nll mean: 103.9526138305664 	 kl mean: 9.257952690124512 	 loss mean: 113.2105712890625



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.79it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.78it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.763916015625 	 kl mean: 9.257952690124512 	 loss mean: 114.0218734741211
nll mean: 103.28114318847656 	 kl mean: 9.257952690124512 	 loss mean: 112.53909301757812
nll mean: 103.98748779296875 	 kl mean: 9.257952690124512 	 loss mean: 113.24543762207031



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 10%|█         | 1/10 [00:00<00:00,  9.94it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.01it/s][A

nll mean: 138.69253540039062 	 kl mean: 9.563274383544922 	 loss mean: 148.2558135986328
nll mean: 138.03115844726562 	 kl mean: 9.563274383544922 	 loss mean: 147.59442138671875
nll mean: 138.63014221191406 	 kl mean: 9.563274383544922 	 loss mean: 148.1934356689453



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.97it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A

nll mean: 138.68641662597656 	 kl mean: 9.563274383544922 	 loss mean: 148.24969482421875
nll mean: 138.26023864746094 	 kl mean: 9.563274383544922 	 loss mean: 147.82351684570312
nll mean: 138.69818115234375 	 kl mean: 9.563274383544922 	 loss mean: 148.26145935058594



 60%|██████    | 6/10 [00:00<00:00, 10.00it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.97it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.97it/s][A
[A                                           

nll mean: 138.3076934814453 	 kl mean: 9.563274383544922 	 loss mean: 147.8709716796875
nll mean: 138.39254760742188 	 kl mean: 9.563274383544922 	 loss mean: 147.955810546875


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.96it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 10.01it/s][A
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:20<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 139.1182098388672 	 kl mean: 9.563274383544922 	 loss mean: 148.68148803710938
nll mean: 138.3102569580078 	 kl mean: 9.563274383544922 	 loss mean: 147.87353515625
nll mean: 62.17609786987305 	 kl mean: 8.54819107055664 	 loss mean: 70.72428131103516
nll mean: 61.3813591003418 	 kl mean: 8.54819107055664 	 loss mean: 69.92955017089844


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 26.50it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.09it/s]

nll mean: 61.681243896484375 	 kl mean: 8.54819107055664 	 loss mean: 70.22943878173828
nll mean: 61.806373596191406 	 kl mean: 8.54819107055664 	 loss mean: 70.35456848144531
nll mean: 62.21870803833008 	 kl mean: 8.54819107055664 	 loss mean: 70.76689910888672
nll mean: 61.38202667236328 	 kl mean: 8.54819107055664 	 loss mean: 69.93022155761719
nll mean: 62.39936828613281 	 kl mean: 8.54819107055664 	 loss mean: 70.94755554199219
nll mean: 62.065425872802734 	 kl mean: 8.54819107055664 	 loss mean: 70.61361694335938


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 26.09it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
100%|██████████| 10/10 [00:00<00:00, 25.42it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.17it/s][A

nll mean: 61.68160629272461 	 kl mean: 8.54819107055664 	 loss mean: 70.22979736328125
nll mean: 61.29724884033203 	 kl mean: 8.54819107055664 	 loss mean: 69.84544372558594
nll mean: 118.4932632446289 	 kl mean: 8.4747314453125 	 loss mean: 126.96800231933594
nll mean: 118.18550109863281 	 kl mean: 8.4747314453125 	 loss mean: 126.66022491455078
nll mean: 118.72625732421875 	 kl mean: 8.4747314453125 	 loss mean: 127.20098876953125



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.04it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A

nll mean: 118.69490051269531 	 kl mean: 8.4747314453125 	 loss mean: 127.16962432861328
nll mean: 117.76180267333984 	 kl mean: 8.4747314453125 	 loss mean: 126.23654174804688
nll mean: 118.15425109863281 	 kl mean: 8.4747314453125 	 loss mean: 126.62899017333984
nll mean: 118.06430053710938 	 kl mean: 8.4747314453125 	 loss mean: 126.53902435302734
nll mean: 118.14497375488281 	 kl mean: 8.4747314453125 	 loss mean: 126.61970520019531



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.07it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 20.99it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.22453308105469 	 kl mean: 8.4747314453125 	 loss mean: 126.69926452636719
nll mean: 118.50558471679688 	 kl mean: 8.4747314453125 	 loss mean: 126.98031616210938
nll mean: 119.28338623046875 	 kl mean: 9.434602737426758 	 loss mean: 128.71798706054688


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A

nll mean: 119.36192321777344 	 kl mean: 9.434602737426758 	 loss mean: 128.79652404785156
nll mean: 119.07125091552734 	 kl mean: 9.434602737426758 	 loss mean: 128.505859375
nll mean: 118.60333251953125 	 kl mean: 9.434602737426758 	 loss mean: 128.03793334960938


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A

nll mean: 119.00489044189453 	 kl mean: 9.434602737426758 	 loss mean: 128.43948364257812
nll mean: 119.33453369140625 	 kl mean: 9.434602737426758 	 loss mean: 128.7691192626953
nll mean: 118.74427795410156 	 kl mean: 9.434602737426758 	 loss mean: 128.1788787841797


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.50it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.47it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.98834228515625 	 kl mean: 9.434602737426758 	 loss mean: 128.42295837402344
nll mean: 119.89219665527344 	 kl mean: 9.434602737426758 	 loss mean: 129.32681274414062
nll mean: 118.85087585449219 	 kl mean: 9.434602737426758 	 loss mean: 128.2854766845703



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.65it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s][A

nll mean: 113.34986114501953 	 kl mean: 8.59105110168457 	 loss mean: 121.94091033935547
nll mean: 114.1915283203125 	 kl mean: 8.59105110168457 	 loss mean: 122.78257751464844
nll mean: 113.77548217773438 	 kl mean: 8.59105110168457 	 loss mean: 122.36653137207031



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.62it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A

nll mean: 113.76025390625 	 kl mean: 8.59105110168457 	 loss mean: 122.35130310058594
nll mean: 113.792724609375 	 kl mean: 8.59105110168457 	 loss mean: 122.38377380371094
nll mean: 114.05128479003906 	 kl mean: 8.59105110168457 	 loss mean: 122.64234161376953



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.58it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A

nll mean: 113.75601959228516 	 kl mean: 8.59105110168457 	 loss mean: 122.34707641601562
nll mean: 114.04176330566406 	 kl mean: 8.59105110168457 	 loss mean: 122.6328125
nll mean: 113.6943130493164 	 kl mean: 8.59105110168457 	 loss mean: 122.28536224365234



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.57it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.78it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A

nll mean: 113.40834045410156 	 kl mean: 8.59105110168457 	 loss mean: 121.9993896484375
nll mean: 110.53711700439453 	 kl mean: 8.656253814697266 	 loss mean: 119.19337463378906
nll mean: 110.57293701171875 	 kl mean: 8.656253814697266 	 loss mean: 119.22918701171875
nll mean: 110.12078857421875 	 kl mean: 8.656253814697266 	 loss mean: 118.77705383300781
nll mean: 110.58100128173828 	 kl mean: 8.656253814697266 	 loss mean: 119.23724365234375



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 50%|█████     | 5/10 [00:00<00:00, 21.61it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 80%|████████  | 8/10 [00:00<00:00, 21.51it/s][A
                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A

nll mean: 110.68183898925781 	 kl mean: 8.656253814697266 	 loss mean: 119.33808898925781
nll mean: 110.96375274658203 	 kl mean: 8.656253814697266 	 loss mean: 119.62001037597656
nll mean: 110.51507568359375 	 kl mean: 8.656253814697266 	 loss mean: 119.17132568359375
nll mean: 110.75835418701172 	 kl mean: 8.656253814697266 	 loss mean: 119.41461181640625
nll mean: 109.94792938232422 	 kl mean: 8.656253814697266 	 loss mean: 118.60418701171875



                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A
100%|██████████| 10/10 [00:00<00:00, 20.80it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 30.65it/s][A

nll mean: 110.33194732666016 	 kl mean: 8.656253814697266 	 loss mean: 118.98820495605469
nll mean: 86.38906860351562 	 kl mean: 9.740373611450195 	 loss mean: 96.12944030761719
nll mean: 84.76604461669922 	 kl mean: 9.740373611450195 	 loss mean: 94.50640869140625
nll mean: 85.78645324707031 	 kl mean: 9.740373611450195 	 loss mean: 95.52682495117188
nll mean: 85.64801025390625 	 kl mean: 9.740373611450195 	 loss mean: 95.38839721679688
nll mean: 85.52317810058594 	 kl mean: 9.740373611450195 	 loss mean: 95.26353454589844


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 30.65it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
100%|██████████| 10/10 [00:00<00:00, 30.25it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.56it/s]


nll mean: 85.25126647949219 	 kl mean: 9.740373611450195 	 loss mean: 94.99163818359375
nll mean: 85.25393676757812 	 kl mean: 9.740373611450195 	 loss mean: 94.99430847167969
nll mean: 85.59688568115234 	 kl mean: 9.740373611450195 	 loss mean: 95.33726501464844
nll mean: 86.16988372802734 	 kl mean: 9.740373611450195 	 loss mean: 95.91026306152344
nll mean: 85.92730712890625 	 kl mean: 9.740373611450195 	 loss mean: 95.66768646240234
Approximate NLL:
tensor(120.9362, device='cuda:0')
Approximate KL:
tensor(8.9841, device='cuda:0')
Testing took 0:00:25.409169


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .78it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .78it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.78it/s][A

nll mean: 108.8780517578125 	 kl mean: 9.823039054870605 	 loss mean: 118.70109558105469
nll mean: 108.84358215332031 	 kl mean: 9.823039054870605 	 loss mean: 118.6666259765625
nll mean: 108.57289123535156 	 kl mean: 9.823039054870605 	 loss mean: 118.39593505859375
nll mean: 109.06285095214844 	 kl mean: 9.823039054870605 	 loss mean: 118.88589477539062
nll mean: 109.31573486328125 	 kl mean: 9.823039054870605 	 loss mean: 119.1387710571289


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.78it/s][A
                                      .39it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .39it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .39it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.39it/s][A
                                      .10it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 24.82it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.94084930419922 	 kl mean: 9.823039054870605 	 loss mean: 118.76388549804688
nll mean: 109.07747650146484 	 kl mean: 9.823039054870605 	 loss mean: 118.9005126953125
nll mean: 109.05863189697266 	 kl mean: 9.823039054870605 	 loss mean: 118.88167572021484
nll mean: 109.74530029296875 	 kl mean: 9.823039054870605 	 loss mean: 119.56834411621094
nll mean: 109.67315673828125 	 kl mean: 9.823039054870605 	 loss mean: 119.4961929321289


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.91it/s][A

nll mean: 126.97502136230469 	 kl mean: 9.665081977844238 	 loss mean: 136.64010620117188
nll mean: 126.96321105957031 	 kl mean: 9.665081977844238 	 loss mean: 136.6282958984375
nll mean: 127.10377502441406 	 kl mean: 9.665081977844238 	 loss mean: 136.76885986328125


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.91it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 40%|████      | 4/10 [00:00<00:00, 13.89it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.89it/s][A

nll mean: 126.9528579711914 	 kl mean: 9.665081977844238 	 loss mean: 136.61793518066406
nll mean: 127.35737609863281 	 kl mean: 9.665081977844238 	 loss mean: 137.0224609375
nll mean: 127.25811767578125 	 kl mean: 9.665081977844238 	 loss mean: 136.92320251464844


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.89it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.91it/s][A

nll mean: 127.51203918457031 	 kl mean: 9.665081977844238 	 loss mean: 137.1771240234375
nll mean: 126.87287902832031 	 kl mean: 9.665081977844238 	 loss mean: 136.53794860839844
nll mean: 127.6448745727539 	 kl mean: 9.665081977844238 	 loss mean: 137.30996704101562


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.91it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.01it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.77it/s][A

nll mean: 127.01142883300781 	 kl mean: 9.665081977844238 	 loss mean: 136.67649841308594
nll mean: 98.48988342285156 	 kl mean: 8.926055908203125 	 loss mean: 107.41593933105469
nll mean: 99.36991882324219 	 kl mean: 8.926055908203125 	 loss mean: 108.29597473144531
nll mean: 98.24906158447266 	 kl mean: 8.926055908203125 	 loss mean: 107.17511749267578
nll mean: 98.43311309814453 	 kl mean: 8.926055908203125 	 loss mean: 107.35916137695312


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.77it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.37it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.16it/s][A

nll mean: 98.45321655273438 	 kl mean: 8.926055908203125 	 loss mean: 107.3792724609375
nll mean: 99.04397583007812 	 kl mean: 8.926055908203125 	 loss mean: 107.97002410888672
nll mean: 98.9697265625 	 kl mean: 8.926055908203125 	 loss mean: 107.89578247070312
nll mean: 98.9140625 	 kl mean: 8.926055908203125 	 loss mean: 107.84011840820312
nll mean: 98.68357849121094 	 kl mean: 8.926055908203125 	 loss mean: 107.60962677001953


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 23.84it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.60it/s][A

nll mean: 98.39352416992188 	 kl mean: 8.926055908203125 	 loss mean: 107.319580078125
nll mean: 137.26295471191406 	 kl mean: 9.639511108398438 	 loss mean: 146.90245056152344
nll mean: 137.61338806152344 	 kl mean: 9.639511108398438 	 loss mean: 147.25289916992188


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.10it/s]
 20%|██        | 2/10 [00:00<00:00, 10.60it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A

nll mean: 137.0572509765625 	 kl mean: 9.639511108398438 	 loss mean: 146.69676208496094
nll mean: 137.66004943847656 	 kl mean: 9.639511108398438 	 loss mean: 147.29954528808594
nll mean: 137.95596313476562 	 kl mean: 9.639511108398438 	 loss mean: 147.59548950195312


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.55it/s][A

nll mean: 137.34658813476562 	 kl mean: 9.639511108398438 	 loss mean: 146.986083984375
nll mean: 137.8732147216797 	 kl mean: 9.639511108398438 	 loss mean: 147.51272583007812
nll mean: 137.1504364013672 	 kl mean: 9.639511108398438 	 loss mean: 146.78994750976562


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.10it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.52it/s][A
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
                                              
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.47686767578125 	 kl mean: 9.639511108398438 	 loss mean: 147.11636352539062
nll mean: 137.0079345703125 	 kl mean: 9.639511108398438 	 loss mean: 146.64744567871094
nll mean: 125.77889251708984 	 kl mean: 9.104228973388672 	 loss mean: 134.88311767578125


                                              
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
 20%|██        | 2/10 [00:00<00:00, 13.83it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.64it/s][A

nll mean: 126.0237045288086 	 kl mean: 9.104228973388672 	 loss mean: 135.1279296875
nll mean: 125.33844757080078 	 kl mean: 9.104228973388672 	 loss mean: 134.4426727294922
nll mean: 125.64403533935547 	 kl mean: 9.104228973388672 	 loss mean: 134.74827575683594


                                              
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:21,  1.62it/s]
 40%|████      | 4/10 [00:00<00:00, 13.64it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.62it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.68it/s][A

nll mean: 125.87740325927734 	 kl mean: 9.104228973388672 	 loss mean: 134.98162841796875
nll mean: 126.48189544677734 	 kl mean: 9.104228973388672 	 loss mean: 135.58612060546875
nll mean: 126.34332275390625 	 kl mean: 9.104228973388672 	 loss mean: 135.4475555419922


                                              
 11%|█         | 4/38 [00:03<00:21,  1.62it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.68it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.62it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:21,  1.62it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.74it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.80648040771484 	 kl mean: 9.104228973388672 	 loss mean: 135.91070556640625
nll mean: 125.65347290039062 	 kl mean: 9.104228973388672 	 loss mean: 134.75770568847656
nll mean: 126.0835189819336 	 kl mean: 9.104228973388672 	 loss mean: 135.187744140625


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 13.53it/s][A

nll mean: 122.75428009033203 	 kl mean: 9.229398727416992 	 loss mean: 131.9836883544922
nll mean: 123.48106384277344 	 kl mean: 9.229398727416992 	 loss mean: 132.71046447753906
nll mean: 123.14738464355469 	 kl mean: 9.229398727416992 	 loss mean: 132.3767852783203


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 13.53it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 13.67it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.76it/s][A

nll mean: 123.36712646484375 	 kl mean: 9.229398727416992 	 loss mean: 132.59652709960938
nll mean: 122.99333190917969 	 kl mean: 9.229398727416992 	 loss mean: 132.22271728515625
nll mean: 123.43891906738281 	 kl mean: 9.229398727416992 	 loss mean: 132.66830444335938


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.76it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.79it/s][A

nll mean: 123.53636169433594 	 kl mean: 9.229398727416992 	 loss mean: 132.7657470703125
nll mean: 122.83721923828125 	 kl mean: 9.229398727416992 	 loss mean: 132.06661987304688
nll mean: 123.45372772216797 	 kl mean: 9.229398727416992 	 loss mean: 132.68312072753906


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 13.79it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.83it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.48it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.48it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 24.42it/s][A

nll mean: 123.3350830078125 	 kl mean: 9.229398727416992 	 loss mean: 132.56448364257812
nll mean: 134.34298706054688 	 kl mean: 9.141291618347168 	 loss mean: 143.48428344726562
nll mean: 134.2837677001953 	 kl mean: 9.141291618347168 	 loss mean: 143.42507934570312
nll mean: 134.2982940673828 	 kl mean: 9.141291618347168 	 loss mean: 143.4395751953125
nll mean: 134.17831420898438 	 kl mean: 9.141291618347168 	 loss mean: 143.31959533691406


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
 30%|███       | 3/10 [00:00<00:00, 24.42it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.26it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.08it/s][A

nll mean: 134.3524169921875 	 kl mean: 9.141291618347168 	 loss mean: 143.4936981201172
nll mean: 134.212646484375 	 kl mean: 9.141291618347168 	 loss mean: 143.3539276123047
nll mean: 134.01434326171875 	 kl mean: 9.141291618347168 	 loss mean: 143.1556396484375
nll mean: 133.75680541992188 	 kl mean: 9.141291618347168 	 loss mean: 142.89810180664062
nll mean: 134.95310974121094 	 kl mean: 9.141291618347168 	 loss mean: 144.09439086914062


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 23.90it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
 30%|███       | 3/10 [00:00<00:00, 23.88it/s][A

nll mean: 134.44058227539062 	 kl mean: 9.141291618347168 	 loss mean: 143.58189392089844
nll mean: 104.74224853515625 	 kl mean: 9.147454261779785 	 loss mean: 113.88970184326172
nll mean: 105.32475280761719 	 kl mean: 9.147454261779785 	 loss mean: 114.47221374511719
nll mean: 105.38896942138672 	 kl mean: 9.147454261779785 	 loss mean: 114.53642272949219
nll mean: 105.454345703125 	 kl mean: 9.147454261779785 	 loss mean: 114.601806640625


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
 30%|███       | 3/10 [00:00<00:00, 23.88it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.87it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 23.76it/s][A

nll mean: 104.98471069335938 	 kl mean: 9.147454261779785 	 loss mean: 114.13216400146484
nll mean: 105.73164367675781 	 kl mean: 9.147454261779785 	 loss mean: 114.87908935546875
nll mean: 105.29927062988281 	 kl mean: 9.147454261779785 	 loss mean: 114.44673156738281
nll mean: 104.80268096923828 	 kl mean: 9.147454261779785 	 loss mean: 113.95013427734375
nll mean: 104.5912094116211 	 kl mean: 9.147454261779785 	 loss mean: 113.73866271972656


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.67it/s]
100%|██████████| 10/10 [00:00<00:00, 23.58it/s][A
 21%|██        | 8/38 [00:04<00:16,  1.83it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.83it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A

nll mean: 104.76732635498047 	 kl mean: 9.147454261779785 	 loss mean: 113.91477966308594
nll mean: 130.39791870117188 	 kl mean: 10.27691650390625 	 loss mean: 140.67481994628906
nll mean: 130.18321228027344 	 kl mean: 10.27691650390625 	 loss mean: 140.46011352539062


                                              
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
 20%|██        | 2/10 [00:00<00:00, 14.52it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
                                              [A

nll mean: 130.69236755371094 	 kl mean: 10.27691650390625 	 loss mean: 140.96926879882812
nll mean: 131.013916015625 	 kl mean: 10.27691650390625 	 loss mean: 141.29083251953125
nll mean: 130.94754028320312 	 kl mean: 10.27691650390625 	 loss mean: 141.22445678710938



 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
 40%|████      | 4/10 [00:00<00:00, 14.53it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.51it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.83it/s][A

nll mean: 130.26429748535156 	 kl mean: 10.27691650390625 	 loss mean: 140.54122924804688
nll mean: 130.41355895996094 	 kl mean: 10.27691650390625 	 loss mean: 140.6904754638672
nll mean: 130.08045959472656 	 kl mean: 10.27691650390625 	 loss mean: 140.3573760986328
nll mean: 131.5587158203125 	 kl mean: 10.27691650390625 	 loss mean: 141.8356170654297


                                              
 21%|██        | 8/38 [00:05<00:16,  1.83it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.69it/s][A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
                                              

nll mean: 130.12884521484375 	 kl mean: 10.27691650390625 	 loss mean: 140.40576171875
nll mean: 128.00498962402344 	 kl mean: 10.041580200195312 	 loss mean: 138.0465850830078
nll mean: 128.28294372558594 	 kl mean: 10.041580200195312 	 loss mean: 138.32452392578125
nll mean: 128.38821411132812 	 kl mean: 10.041580200195312 	 loss mean: 138.42979431152344


 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
 30%|███       | 3/10 [00:00<00:00, 20.89it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
 50%|█████     | 5/10 [00:00<00:00, 20.54it/s][A
 70%|███████   | 7/10 [00:00<00:00, 20.28it/s][A

nll mean: 128.3668212890625 	 kl mean: 10.041580200195312 	 loss mean: 138.4084014892578
nll mean: 128.70420837402344 	 kl mean: 10.041580200195312 	 loss mean: 138.74578857421875
nll mean: 128.72439575195312 	 kl mean: 10.041580200195312 	 loss mean: 138.76597595214844
nll mean: 129.2725067138672 	 kl mean: 10.041580200195312 	 loss mean: 139.3140869140625


                                              
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
 70%|███████   | 7/10 [00:00<00:00, 20.28it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:17,  1.70it/s]
100%|██████████| 10/10 [00:00<00:00, 19.95it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.78it/s]
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.7857666015625 	 kl mean: 10.041580200195312 	 loss mean: 138.82736206054688
nll mean: 129.44784545898438 	 kl mean: 10.041580200195312 	 loss mean: 139.48941040039062
nll mean: 128.28707885742188 	 kl mean: 10.041580200195312 	 loss mean: 138.32867431640625
nll mean: 118.55032348632812 	 kl mean: 9.892952919006348 	 loss mean: 128.4432830810547
nll mean: 118.49063873291016 	 kl mean: 9.892952919006348 	 loss mean: 128.38357543945312


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
 30%|███       | 3/10 [00:00<00:00, 23.77it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.71it/s][A

nll mean: 118.54020690917969 	 kl mean: 9.892952919006348 	 loss mean: 128.43316650390625
nll mean: 119.08792114257812 	 kl mean: 9.892952919006348 	 loss mean: 128.98086547851562
nll mean: 118.390380859375 	 kl mean: 9.892952919006348 	 loss mean: 128.2833251953125
nll mean: 118.01689147949219 	 kl mean: 9.892952919006348 	 loss mean: 127.90984344482422
nll mean: 118.22848510742188 	 kl mean: 9.892952919006348 	 loss mean: 128.12142944335938


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
 60%|██████    | 6/10 [00:00<00:00, 23.71it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.78it/s]
100%|██████████| 10/10 [00:00<00:00, 23.58it/s][A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.46437072753906 	 kl mean: 9.892952919006348 	 loss mean: 128.35731506347656
nll mean: 118.68939971923828 	 kl mean: 9.892952919006348 	 loss mean: 128.5823516845703
nll mean: 118.7412109375 	 kl mean: 9.892952919006348 	 loss mean: 128.6341552734375
nll mean: 141.56167602539062 	 kl mean: 10.114208221435547 	 loss mean: 151.6759033203125
nll mean: 141.97573852539062 	 kl mean: 10.114208221435547 	 loss mean: 152.0899658203125


                                               
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
 30%|███       | 3/10 [00:00<00:00, 20.59it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
 60%|██████    | 6/10 [00:00<00:00, 20.63it/s][A

nll mean: 141.23904418945312 	 kl mean: 10.114208221435547 	 loss mean: 151.353271484375
nll mean: 140.37547302246094 	 kl mean: 10.114208221435547 	 loss mean: 150.48968505859375
nll mean: 141.77951049804688 	 kl mean: 10.114208221435547 	 loss mean: 151.89370727539062
nll mean: 141.1970672607422 	 kl mean: 10.114208221435547 	 loss mean: 151.31129455566406
nll mean: 141.060546875 	 kl mean: 10.114208221435547 	 loss mean: 151.17474365234375


                                               
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
 60%|██████    | 6/10 [00:00<00:00, 20.63it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:14,  1.92it/s]
100%|██████████| 10/10 [00:00<00:00, 20.55it/s][A
 32%|███▏      | 12/38 [00:06<00:13,  1.95it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:13,  1.95it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 141.55361938476562 	 kl mean: 10.114208221435547 	 loss mean: 151.66781616210938
nll mean: 141.4785919189453 	 kl mean: 10.114208221435547 	 loss mean: 151.59280395507812
nll mean: 141.41555786132812 	 kl mean: 10.114208221435547 	 loss mean: 151.52975463867188
nll mean: 119.69029235839844 	 kl mean: 10.0911226272583 	 loss mean: 129.78143310546875


                                               
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
 20%|██        | 2/10 [00:00<00:00, 12.00it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.06it/s][A

nll mean: 118.68791198730469 	 kl mean: 10.0911226272583 	 loss mean: 128.77902221679688
nll mean: 119.68362426757812 	 kl mean: 10.0911226272583 	 loss mean: 129.77474975585938
nll mean: 118.68193817138672 	 kl mean: 10.0911226272583 	 loss mean: 128.7730712890625


                                               
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
 40%|████      | 4/10 [00:00<00:00, 12.06it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.16it/s][A

nll mean: 118.871826171875 	 kl mean: 10.0911226272583 	 loss mean: 128.96295166015625
nll mean: 119.16343688964844 	 kl mean: 10.0911226272583 	 loss mean: 129.2545623779297
nll mean: 118.93622589111328 	 kl mean: 10.0911226272583 	 loss mean: 129.02734375


                                               
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.16it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  1.95it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.24it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.31it/s][A
 34%|███▍      | 13/38 [00:07<00:15,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.73471069335938 	 kl mean: 10.0911226272583 	 loss mean: 128.82582092285156
nll mean: 119.06037902832031 	 kl mean: 10.0911226272583 	 loss mean: 129.15150451660156
nll mean: 119.2073974609375 	 kl mean: 10.0911226272583 	 loss mean: 129.29852294921875


                                               
 34%|███▍      | 13/38 [00:07<00:15,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:15,  1.66it/s]
 10%|█         | 1/10 [00:00<00:00,  9.83it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.81it/s][A

nll mean: 162.07989501953125 	 kl mean: 9.945308685302734 	 loss mean: 172.02520751953125
nll mean: 161.841064453125 	 kl mean: 9.945308685302734 	 loss mean: 171.78636169433594


                                               
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00,  9.81it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 30%|███       | 3/10 [00:00<00:00,  9.76it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.77it/s][A

nll mean: 162.33544921875 	 kl mean: 9.945308685302734 	 loss mean: 172.28076171875
nll mean: 162.11325073242188 	 kl mean: 9.945308685302734 	 loss mean: 172.0585479736328


                                               
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
                                               [A
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00,  9.77it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.84it/s]

nll mean: 162.0926513671875 	 kl mean: 9.945308685302734 	 loss mean: 172.0379638671875
nll mean: 163.1751708984375 	 kl mean: 9.945308685302734 	 loss mean: 173.12049865722656
nll mean: 162.05303955078125 	 kl mean: 9.945308685302734 	 loss mean: 171.9983367919922


                                               
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.84it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A
                                               [A


nll mean: 162.3438720703125 	 kl mean: 9.945308685302734 	 loss mean: 172.2891845703125
nll mean: 162.11068725585938 	 kl mean: 9.945308685302734 	 loss mean: 172.05599975585938


 34%|███▍      | 13/38 [00:08<00:15,  1.66it/s]
100%|██████████| 10/10 [00:01<00:00,  9.91it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.38it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.38it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 18.41it/s][A

nll mean: 161.53314208984375 	 kl mean: 9.945308685302734 	 loss mean: 171.47845458984375
nll mean: 136.19512939453125 	 kl mean: 8.914510726928711 	 loss mean: 145.10964965820312
nll mean: 135.7028350830078 	 kl mean: 8.914510726928711 	 loss mean: 144.61734008789062
nll mean: 135.7802734375 	 kl mean: 8.914510726928711 	 loss mean: 144.69479370117188


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 18.41it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 18.21it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.16it/s][A

nll mean: 136.35147094726562 	 kl mean: 8.914510726928711 	 loss mean: 145.2659912109375
nll mean: 135.5682373046875 	 kl mean: 8.914510726928711 	 loss mean: 144.48275756835938
nll mean: 135.73121643066406 	 kl mean: 8.914510726928711 	 loss mean: 144.64572143554688
nll mean: 135.67588806152344 	 kl mean: 8.914510726928711 	 loss mean: 144.59039306640625


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 18.16it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 18.02it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.97it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 136.63421630859375 	 kl mean: 8.914510726928711 	 loss mean: 145.54873657226562
nll mean: 135.98008728027344 	 kl mean: 8.914510726928711 	 loss mean: 144.8946075439453
nll mean: 136.56674194335938 	 kl mean: 8.914510726928711 	 loss mean: 145.48126220703125


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A

nll mean: 142.05291748046875 	 kl mean: 9.784601211547852 	 loss mean: 151.83750915527344
nll mean: 142.31117248535156 	 kl mean: 9.784601211547852 	 loss mean: 152.09576416015625
nll mean: 143.02354431152344 	 kl mean: 9.784601211547852 	 loss mean: 152.80813598632812


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.79it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.79it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.79it/s][A

nll mean: 142.57025146484375 	 kl mean: 9.784601211547852 	 loss mean: 152.3548583984375
nll mean: 142.33604431152344 	 kl mean: 9.784601211547852 	 loss mean: 152.12063598632812
nll mean: 142.15020751953125 	 kl mean: 9.784601211547852 	 loss mean: 151.93478393554688


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.79it/s][A
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A

nll mean: 142.64413452148438 	 kl mean: 9.784601211547852 	 loss mean: 152.42874145507812
nll mean: 142.1416473388672 	 kl mean: 9.784601211547852 	 loss mean: 151.92623901367188
nll mean: 142.72142028808594 	 kl mean: 9.784601211547852 	 loss mean: 152.5060272216797


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.68it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.23it/s][A

nll mean: 141.9366455078125 	 kl mean: 9.784601211547852 	 loss mean: 151.72125244140625
nll mean: 143.44790649414062 	 kl mean: 8.944929122924805 	 loss mean: 152.392822265625
nll mean: 143.67901611328125 	 kl mean: 8.944929122924805 	 loss mean: 152.6239471435547
nll mean: 144.16973876953125 	 kl mean: 8.944929122924805 	 loss mean: 153.1146697998047
nll mean: 143.53240966796875 	 kl mean: 8.944929122924805 	 loss mean: 152.4773406982422


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.23it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.08it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.21it/s][A

nll mean: 144.43637084960938 	 kl mean: 8.944929122924805 	 loss mean: 153.38128662109375
nll mean: 143.79371643066406 	 kl mean: 8.944929122924805 	 loss mean: 152.7386474609375
nll mean: 143.7899169921875 	 kl mean: 8.944929122924805 	 loss mean: 152.73484802246094
nll mean: 143.8414764404297 	 kl mean: 8.944929122924805 	 loss mean: 152.78640747070312
nll mean: 144.1165313720703 	 kl mean: 8.944929122924805 	 loss mean: 153.06146240234375


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
100%|██████████| 10/10 [00:00<00:00, 24.17it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A

nll mean: 143.70620727539062 	 kl mean: 8.944929122924805 	 loss mean: 152.651123046875
nll mean: 132.5523681640625 	 kl mean: 9.277220726013184 	 loss mean: 141.82958984375
nll mean: 133.42352294921875 	 kl mean: 9.277220726013184 	 loss mean: 142.70074462890625
nll mean: 133.20050048828125 	 kl mean: 9.277220726013184 	 loss mean: 142.47772216796875
nll mean: 133.08563232421875 	 kl mean: 9.277220726013184 	 loss mean: 142.36285400390625


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 24.91it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:11<00:13,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.81it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.67it/s][A

nll mean: 133.90208435058594 	 kl mean: 9.277220726013184 	 loss mean: 143.17930603027344
nll mean: 133.52587890625 	 kl mean: 9.277220726013184 	 loss mean: 142.8031005859375
nll mean: 133.0048065185547 	 kl mean: 9.277220726013184 	 loss mean: 142.2820281982422
nll mean: 133.37881469726562 	 kl mean: 9.277220726013184 	 loss mean: 142.65603637695312
nll mean: 132.71197509765625 	 kl mean: 9.277220726013184 	 loss mean: 141.98919677734375


                                               
 45%|████▍     | 17/38 [00:11<00:13,  1.53it/s]
100%|██████████| 10/10 [00:00<00:00, 24.57it/s][A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A

nll mean: 133.15940856933594 	 kl mean: 9.277220726013184 	 loss mean: 142.4366455078125
nll mean: 129.4992218017578 	 kl mean: 10.383888244628906 	 loss mean: 139.88311767578125
nll mean: 129.2623748779297 	 kl mean: 10.383888244628906 	 loss mean: 139.64627075195312


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 20%|██        | 2/10 [00:00<00:00, 12.40it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A

nll mean: 129.28106689453125 	 kl mean: 10.383888244628906 	 loss mean: 139.66494750976562
nll mean: 129.580078125 	 kl mean: 10.383888244628906 	 loss mean: 139.9639892578125
nll mean: 129.8671417236328 	 kl mean: 10.383888244628906 	 loss mean: 140.25103759765625


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 40%|████      | 4/10 [00:00<00:00, 12.55it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A

nll mean: 129.57872009277344 	 kl mean: 10.383888244628906 	 loss mean: 139.9626007080078
nll mean: 129.95465087890625 	 kl mean: 10.383888244628906 	 loss mean: 140.33853149414062
nll mean: 129.67193603515625 	 kl mean: 10.383888244628906 	 loss mean: 140.0558319091797


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.67it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.62it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 129.5226593017578 	 kl mean: 10.383888244628906 	 loss mean: 139.9065399169922
nll mean: 129.58511352539062 	 kl mean: 10.383888244628906 	 loss mean: 139.968994140625
nll mean: 148.54566955566406 	 kl mean: 9.777557373046875 	 loss mean: 158.32322692871094


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.33it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.39it/s][A

nll mean: 149.08615112304688 	 kl mean: 9.777557373046875 	 loss mean: 158.86370849609375
nll mean: 148.9508819580078 	 kl mean: 9.777557373046875 	 loss mean: 158.7284393310547
nll mean: 148.71287536621094 	 kl mean: 9.777557373046875 	 loss mean: 158.49044799804688


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 40%|████      | 4/10 [00:00<00:00, 12.39it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.36it/s][A

nll mean: 149.0648956298828 	 kl mean: 9.777557373046875 	 loss mean: 158.8424530029297
nll mean: 149.060302734375 	 kl mean: 9.777557373046875 	 loss mean: 158.83786010742188
nll mean: 148.56338500976562 	 kl mean: 9.777557373046875 	 loss mean: 158.3409423828125


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.36it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.36it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.39it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 148.50917053222656 	 kl mean: 9.777557373046875 	 loss mean: 158.28671264648438
nll mean: 148.6278076171875 	 kl mean: 9.777557373046875 	 loss mean: 158.40536499023438
nll mean: 148.51205444335938 	 kl mean: 9.777557373046875 	 loss mean: 158.2896270751953


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.70it/s][A

nll mean: 157.30564880371094 	 kl mean: 9.65139389038086 	 loss mean: 166.95704650878906
nll mean: 157.76126098632812 	 kl mean: 9.65139389038086 	 loss mean: 167.41265869140625
nll mean: 156.8876495361328 	 kl mean: 9.65139389038086 	 loss mean: 166.53904724121094


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.70it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.69it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A

nll mean: 157.71304321289062 	 kl mean: 9.65139389038086 	 loss mean: 167.36444091796875
nll mean: 157.76779174804688 	 kl mean: 9.65139389038086 	 loss mean: 167.41915893554688
nll mean: 157.2315673828125 	 kl mean: 9.65139389038086 	 loss mean: 166.88296508789062


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.73it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.80it/s][A

nll mean: 157.16726684570312 	 kl mean: 9.65139389038086 	 loss mean: 166.81866455078125
nll mean: 157.81443786621094 	 kl mean: 9.65139389038086 	 loss mean: 167.4658203125
nll mean: 157.39697265625 	 kl mean: 9.65139389038086 	 loss mean: 167.04837036132812


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.80it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.73it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
  0%|          | 0/10 [00:00<?, ?it/s]

nll mean: 157.26365661621094 	 kl mean: 9.65139389038086 	 loss mean: 166.91506958007812
nll mean: 117.72942352294922 	 kl mean: 9.828261375427246 	 loss mean: 127.55768585205078
nll mean: 117.81150817871094 	 kl mean: 9.828261375427246 	 loss mean: 127.6397705078125


[A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 20%|██        | 2/10 [00:00<00:00, 10.21it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 10.23it/s][A

nll mean: 117.0638427734375 	 kl mean: 9.828261375427246 	 loss mean: 126.89209747314453
nll mean: 117.32035827636719 	 kl mean: 9.828261375427246 	 loss mean: 127.14862060546875
nll mean: 117.53898620605469 	 kl mean: 9.828261375427246 	 loss mean: 127.36724853515625


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
 40%|████      | 4/10 [00:00<00:00, 10.23it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.26it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.27it/s][A

nll mean: 117.46180725097656 	 kl mean: 9.828261375427246 	 loss mean: 127.29006958007812
nll mean: 117.63285827636719 	 kl mean: 9.828261375427246 	 loss mean: 127.46112060546875
nll mean: 117.06968688964844 	 kl mean: 9.828261375427246 	 loss mean: 126.89794158935547


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.38it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.27it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.28it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 117.40836334228516 	 kl mean: 9.828261375427246 	 loss mean: 127.23661804199219
nll mean: 118.23455810546875 	 kl mean: 9.828261375427246 	 loss mean: 128.0628204345703
nll mean: 106.68879699707031 	 kl mean: 8.116063117980957 	 loss mean: 114.80485534667969
nll mean: 106.5834732055664 	 kl mean: 8.116063117980957 	 loss mean: 114.69953918457031
nll mean: 106.6920166015625 	 kl mean: 8.116063117980957 	 loss mean: 114.80807495117188


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
 40%|████      | 4/10 [00:00<00:00, 33.15it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.25it/s]
100%|██████████| 10/10 [00:00<00:00, 32.64it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 106.31219482421875 	 kl mean: 8.116063117980957 	 loss mean: 114.42825317382812
nll mean: 106.07511138916016 	 kl mean: 8.116063117980957 	 loss mean: 114.19116973876953
nll mean: 106.42422485351562 	 kl mean: 8.116063117980957 	 loss mean: 114.540283203125
nll mean: 107.0308837890625 	 kl mean: 8.116063117980957 	 loss mean: 115.14694213867188
nll mean: 106.19166564941406 	 kl mean: 8.116063117980957 	 loss mean: 114.30772399902344
nll mean: 106.37004089355469 	 kl mean: 8.116063117980957 	 loss mean: 114.48609924316406
nll mean: 106.4478530883789 	 kl mean: 8.116063117980957 	 loss mean: 114.56391906738281


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 14.48it/s][A

nll mean: 159.0400848388672 	 kl mean: 8.865479469299316 	 loss mean: 167.9055633544922
nll mean: 159.69778442382812 	 kl mean: 8.865479469299316 	 loss mean: 168.56326293945312
nll mean: 159.50711059570312 	 kl mean: 8.865479469299316 	 loss mean: 168.37258911132812


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 14.48it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 40%|████      | 4/10 [00:00<00:00, 14.60it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.58it/s][A

nll mean: 159.63084411621094 	 kl mean: 8.865479469299316 	 loss mean: 168.49632263183594
nll mean: 158.93777465820312 	 kl mean: 8.865479469299316 	 loss mean: 167.8032684326172
nll mean: 159.76031494140625 	 kl mean: 8.865479469299316 	 loss mean: 168.62579345703125


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.58it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.65it/s][A

nll mean: 159.3035888671875 	 kl mean: 8.865479469299316 	 loss mean: 168.1690673828125
nll mean: 159.44137573242188 	 kl mean: 8.865479469299316 	 loss mean: 168.3068389892578
nll mean: 159.69387817382812 	 kl mean: 8.865479469299316 	 loss mean: 168.55935668945312


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.66it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.04it/s][A

nll mean: 159.38015747070312 	 kl mean: 8.865479469299316 	 loss mean: 168.24563598632812
nll mean: 119.37557983398438 	 kl mean: 10.055252075195312 	 loss mean: 129.43081665039062
nll mean: 119.65765380859375 	 kl mean: 10.055252075195312 	 loss mean: 129.71290588378906
nll mean: 119.39852142333984 	 kl mean: 10.055252075195312 	 loss mean: 129.4537811279297
nll mean: 119.33355712890625 	 kl mean: 10.055252075195312 	 loss mean: 129.38880920410156


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 22.04it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.92it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.66it/s][A

nll mean: 119.9319839477539 	 kl mean: 10.055252075195312 	 loss mean: 129.98724365234375
nll mean: 119.65043640136719 	 kl mean: 10.055252075195312 	 loss mean: 129.7056884765625
nll mean: 119.34898376464844 	 kl mean: 10.055252075195312 	 loss mean: 129.40423583984375
nll mean: 119.58074188232422 	 kl mean: 10.055252075195312 	 loss mean: 129.635986328125
nll mean: 119.71304321289062 	 kl mean: 10.055252075195312 	 loss mean: 129.76829528808594


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.46it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.66it/s]
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.56it/s][A

nll mean: 118.65343475341797 	 kl mean: 10.055252075195312 	 loss mean: 128.70867919921875
nll mean: 113.70453643798828 	 kl mean: 9.024948120117188 	 loss mean: 122.7294921875
nll mean: 113.84626770019531 	 kl mean: 9.024948120117188 	 loss mean: 122.8712158203125


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 20%|██        | 2/10 [00:00<00:00, 14.56it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.61it/s][A

nll mean: 113.28118896484375 	 kl mean: 9.024948120117188 	 loss mean: 122.30613708496094
nll mean: 113.93351745605469 	 kl mean: 9.024948120117188 	 loss mean: 122.95846557617188
nll mean: 113.8729019165039 	 kl mean: 9.024948120117188 	 loss mean: 122.8978500366211


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 40%|████      | 4/10 [00:00<00:00, 14.61it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.60it/s][A

nll mean: 113.84407043457031 	 kl mean: 9.024948120117188 	 loss mean: 122.86902618408203
nll mean: 113.66413116455078 	 kl mean: 9.024948120117188 	 loss mean: 122.6890869140625
nll mean: 113.8238296508789 	 kl mean: 9.024948120117188 	 loss mean: 122.8487777709961


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.66it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.66it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               


nll mean: 113.99629211425781 	 kl mean: 9.024948120117188 	 loss mean: 123.02123260498047
nll mean: 113.39634704589844 	 kl mean: 9.024948120117188 	 loss mean: 122.42129516601562
nll mean: 82.22586822509766 	 kl mean: 8.26354694366455 	 loss mean: 90.48941040039062
nll mean: 81.83211517333984 	 kl mean: 8.26354694366455 	 loss mean: 90.09565734863281


 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 23.02it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.51it/s][A

nll mean: 82.03662109375 	 kl mean: 8.26354694366455 	 loss mean: 90.3001708984375
nll mean: 82.26283264160156 	 kl mean: 8.26354694366455 	 loss mean: 90.52638244628906
nll mean: 82.2413330078125 	 kl mean: 8.26354694366455 	 loss mean: 90.5048828125
nll mean: 82.07832336425781 	 kl mean: 8.26354694366455 	 loss mean: 90.34187316894531
nll mean: 81.99053955078125 	 kl mean: 8.26354694366455 	 loss mean: 90.25408935546875


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.51it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:17<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 21.92it/s][A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 81.42505645751953 	 kl mean: 8.26354694366455 	 loss mean: 89.6885986328125
nll mean: 81.98658752441406 	 kl mean: 8.26354694366455 	 loss mean: 90.25013732910156
nll mean: 82.11224365234375 	 kl mean: 8.26354694366455 	 loss mean: 90.37579345703125
nll mean: 109.08057403564453 	 kl mean: 8.362582206726074 	 loss mean: 117.44316101074219
nll mean: 108.49637603759766 	 kl mean: 8.362582206726074 	 loss mean: 116.85896301269531


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.65it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.56it/s][A

nll mean: 109.27079772949219 	 kl mean: 8.362582206726074 	 loss mean: 117.63338470458984
nll mean: 108.61007690429688 	 kl mean: 8.362582206726074 	 loss mean: 116.97265625
nll mean: 108.51275634765625 	 kl mean: 8.362582206726074 	 loss mean: 116.87533569335938
nll mean: 108.55006408691406 	 kl mean: 8.362582206726074 	 loss mean: 116.91264343261719
nll mean: 108.45272064208984 	 kl mean: 8.362582206726074 	 loss mean: 116.8153076171875


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.56it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
100%|██████████| 10/10 [00:00<00:00, 21.54it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.58751678466797 	 kl mean: 8.362582206726074 	 loss mean: 116.95010375976562
nll mean: 108.693115234375 	 kl mean: 8.362582206726074 	 loss mean: 117.05570220947266
nll mean: 108.84552001953125 	 kl mean: 8.362582206726074 	 loss mean: 117.20809936523438
nll mean: 121.43729400634766 	 kl mean: 9.180821418762207 	 loss mean: 130.6181182861328


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 20%|██        | 2/10 [00:00<00:00, 12.34it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.34it/s][A

nll mean: 121.72040557861328 	 kl mean: 9.180821418762207 	 loss mean: 130.90122985839844
nll mean: 121.93008422851562 	 kl mean: 9.180821418762207 	 loss mean: 131.11090087890625
nll mean: 121.93031311035156 	 kl mean: 9.180821418762207 	 loss mean: 131.1111297607422


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.84it/s]
 40%|████      | 4/10 [00:00<00:00, 12.34it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.30it/s][A

nll mean: 122.00074768066406 	 kl mean: 9.180821418762207 	 loss mean: 131.18157958984375
nll mean: 121.36085510253906 	 kl mean: 9.180821418762207 	 loss mean: 130.54168701171875
nll mean: 121.55357360839844 	 kl mean: 9.180821418762207 	 loss mean: 130.73440551757812


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.30it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.84it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.33it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.28it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.93168640136719 	 kl mean: 9.180821418762207 	 loss mean: 131.11251831054688
nll mean: 122.43144989013672 	 kl mean: 9.180821418762207 	 loss mean: 131.61227416992188
nll mean: 121.24174499511719 	 kl mean: 9.180821418762207 	 loss mean: 130.42254638671875


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.98it/s][A

nll mean: 60.84797668457031 	 kl mean: 10.428858757019043 	 loss mean: 71.2768325805664
nll mean: 61.124053955078125 	 kl mean: 10.428858757019043 	 loss mean: 71.55290985107422


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00,  9.98it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A

nll mean: 60.492523193359375 	 kl mean: 10.428858757019043 	 loss mean: 70.92138671875
nll mean: 61.282920837402344 	 kl mean: 10.428858757019043 	 loss mean: 71.71177673339844
nll mean: 61.35049057006836 	 kl mean: 10.428858757019043 	 loss mean: 71.77934265136719



                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.00it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.93it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.00it/s][A

nll mean: 61.30949783325195 	 kl mean: 10.428858757019043 	 loss mean: 71.73835754394531
nll mean: 60.874267578125 	 kl mean: 10.428858757019043 	 loss mean: 71.30313110351562
nll mean: 61.21857452392578 	 kl mean: 10.428858757019043 	 loss mean: 71.64743041992188


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.00it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.04it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 60.93457794189453 	 kl mean: 10.428858757019043 	 loss mean: 71.36343383789062
nll mean: 61.45366287231445 	 kl mean: 10.428858757019043 	 loss mean: 71.88252258300781
nll mean: 104.20021057128906 	 kl mean: 9.93796443939209 	 loss mean: 114.13817596435547


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 13.30it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.04it/s][A

nll mean: 104.76663208007812 	 kl mean: 9.93796443939209 	 loss mean: 114.70458984375
nll mean: 104.21984100341797 	 kl mean: 9.93796443939209 	 loss mean: 114.15780639648438
nll mean: 103.9568862915039 	 kl mean: 9.93796443939209 	 loss mean: 113.89485931396484


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 13.04it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.84it/s][A

nll mean: 103.31976318359375 	 kl mean: 9.93796443939209 	 loss mean: 113.25773620605469
nll mean: 104.23406982421875 	 kl mean: 9.93796443939209 	 loss mean: 114.17204284667969
nll mean: 104.03679656982422 	 kl mean: 9.93796443939209 	 loss mean: 113.97476196289062


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.84it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:20<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:20<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.72it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.60it/s][A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 104.04421997070312 	 kl mean: 9.93796443939209 	 loss mean: 113.982177734375
nll mean: 104.0782470703125 	 kl mean: 9.93796443939209 	 loss mean: 114.0162124633789
nll mean: 104.66661071777344 	 kl mean: 9.93796443939209 	 loss mean: 114.60457611083984


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.07it/s][A

nll mean: 137.9935302734375 	 kl mean: 9.93962287902832 	 loss mean: 147.93316650390625
nll mean: 137.277099609375 	 kl mean: 9.93962287902832 	 loss mean: 147.2167205810547


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00, 10.07it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.92it/s][A

nll mean: 137.72817993164062 	 kl mean: 9.93962287902832 	 loss mean: 147.66781616210938
nll mean: 138.37667846679688 	 kl mean: 9.93962287902832 	 loss mean: 148.3162841796875


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 40%|████      | 4/10 [00:00<00:00,  9.92it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.80it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.79it/s][A

nll mean: 138.20443725585938 	 kl mean: 9.93962287902832 	 loss mean: 148.14405822753906
nll mean: 138.08740234375 	 kl mean: 9.93962287902832 	 loss mean: 148.0270233154297


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.79it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.82it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.83it/s][A

nll mean: 138.022216796875 	 kl mean: 9.93962287902832 	 loss mean: 147.96185302734375
nll mean: 137.72079467773438 	 kl mean: 9.93962287902832 	 loss mean: 147.66041564941406


                                               
 82%|████████▏ | 31/38 [00:21<00:05,  1.32it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.83it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:21<00:05,  1.32it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.85it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.84it/s][A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.70465087890625 	 kl mean: 9.93962287902832 	 loss mean: 147.64425659179688
nll mean: 137.6219024658203 	 kl mean: 9.93962287902832 	 loss mean: 147.5615234375
nll mean: 63.278526306152344 	 kl mean: 9.036154747009277 	 loss mean: 72.31468200683594
nll mean: 62.81999206542969 	 kl mean: 9.036154747009277 	 loss mean: 71.85614013671875


                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
 30%|███       | 3/10 [00:00<00:00, 25.90it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]

nll mean: 62.65879821777344 	 kl mean: 9.036154747009277 	 loss mean: 71.69495391845703
nll mean: 63.25210952758789 	 kl mean: 9.036154747009277 	 loss mean: 72.28826904296875
nll mean: 62.49336242675781 	 kl mean: 9.036154747009277 	 loss mean: 71.5295181274414
nll mean: 62.595123291015625 	 kl mean: 9.036154747009277 	 loss mean: 71.63127899169922
nll mean: 62.85247802734375 	 kl mean: 9.036154747009277 	 loss mean: 71.88863372802734
nll mean: 62.34495162963867 	 kl mean: 9.036154747009277 	 loss mean: 71.381103515625



                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.61it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
100%|██████████| 10/10 [00:00<00:00, 25.39it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 22.07it/s][A

nll mean: 63.077762603759766 	 kl mean: 9.036154747009277 	 loss mean: 72.11392211914062
nll mean: 63.1400146484375 	 kl mean: 9.036154747009277 	 loss mean: 72.1761703491211
nll mean: 119.57330322265625 	 kl mean: 8.503656387329102 	 loss mean: 128.07696533203125
nll mean: 119.2083740234375 	 kl mean: 8.503656387329102 	 loss mean: 127.71202087402344
nll mean: 119.4974594116211 	 kl mean: 8.503656387329102 	 loss mean: 128.00112915039062


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 30%|███       | 3/10 [00:00<00:00, 22.07it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.79it/s][A

nll mean: 119.16958618164062 	 kl mean: 8.503656387329102 	 loss mean: 127.67323303222656
nll mean: 118.86083221435547 	 kl mean: 8.503656387329102 	 loss mean: 127.36448669433594
nll mean: 119.43946838378906 	 kl mean: 8.503656387329102 	 loss mean: 127.94312286376953
nll mean: 118.95628356933594 	 kl mean: 8.503656387329102 	 loss mean: 127.4599380493164
nll mean: 118.84181213378906 	 kl mean: 8.503656387329102 	 loss mean: 127.34546661376953


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.79it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
100%|██████████| 10/10 [00:00<00:00, 21.51it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.87926483154297 	 kl mean: 8.503656387329102 	 loss mean: 127.38291931152344
nll mean: 119.318115234375 	 kl mean: 8.503656387329102 	 loss mean: 127.82177734375
nll mean: 118.14849853515625 	 kl mean: 9.932378768920898 	 loss mean: 128.08087158203125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.32it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.38it/s][A

nll mean: 119.21973419189453 	 kl mean: 9.932378768920898 	 loss mean: 129.152099609375
nll mean: 119.17681884765625 	 kl mean: 9.932378768920898 	 loss mean: 129.10919189453125
nll mean: 119.17622375488281 	 kl mean: 9.932378768920898 	 loss mean: 129.10861206054688


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.38it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.34it/s][A

nll mean: 118.90635681152344 	 kl mean: 9.932378768920898 	 loss mean: 128.83872985839844
nll mean: 118.38534545898438 	 kl mean: 9.932378768920898 	 loss mean: 128.31771850585938
nll mean: 118.6461410522461 	 kl mean: 9.932378768920898 	 loss mean: 128.57852172851562


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.34it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.35it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.37it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.36508178710938 	 kl mean: 9.932378768920898 	 loss mean: 128.29745483398438
nll mean: 118.51731872558594 	 kl mean: 9.932378768920898 	 loss mean: 128.44970703125
nll mean: 119.36949920654297 	 kl mean: 9.932378768920898 	 loss mean: 129.3018798828125


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.61it/s][A

nll mean: 113.51031494140625 	 kl mean: 9.131576538085938 	 loss mean: 122.64189147949219
nll mean: 113.8251953125 	 kl mean: 9.131576538085938 	 loss mean: 122.95677185058594
nll mean: 113.404296875 	 kl mean: 9.131576538085938 	 loss mean: 122.53587341308594


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.61it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A

nll mean: 113.71217346191406 	 kl mean: 9.131576538085938 	 loss mean: 122.84375
nll mean: 113.1205062866211 	 kl mean: 9.131576538085938 	 loss mean: 122.25209045410156
nll mean: 113.77889251708984 	 kl mean: 9.131576538085938 	 loss mean: 122.91046142578125


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.60it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.59it/s][A

nll mean: 113.36351776123047 	 kl mean: 9.131576538085938 	 loss mean: 122.4950942993164
nll mean: 113.60057830810547 	 kl mean: 9.131576538085938 	 loss mean: 122.73214721679688
nll mean: 113.22029113769531 	 kl mean: 9.131576538085938 	 loss mean: 122.35186767578125


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.59it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.59it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.27it/s][A

nll mean: 113.22004699707031 	 kl mean: 9.131576538085938 	 loss mean: 122.35163116455078
nll mean: 111.2992935180664 	 kl mean: 9.185742378234863 	 loss mean: 120.48503875732422
nll mean: 111.22830200195312 	 kl mean: 9.185742378234863 	 loss mean: 120.41404724121094
nll mean: 111.41304779052734 	 kl mean: 9.185742378234863 	 loss mean: 120.59879302978516
nll mean: 111.45484161376953 	 kl mean: 9.185742378234863 	 loss mean: 120.64058685302734


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 22.27it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
 50%|█████     | 5/10 [00:00<00:00, 21.26it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
 80%|████████  | 8/10 [00:00<00:00, 21.22it/s][A

nll mean: 111.30838775634766 	 kl mean: 9.185742378234863 	 loss mean: 120.49413299560547
nll mean: 110.7623291015625 	 kl mean: 9.185742378234863 	 loss mean: 119.94807434082031
nll mean: 111.23487854003906 	 kl mean: 9.185742378234863 	 loss mean: 120.42062377929688
nll mean: 111.02214050292969 	 kl mean: 9.185742378234863 	 loss mean: 120.20787811279297
nll mean: 111.26822662353516 	 kl mean: 9.185742378234863 	 loss mean: 120.45397186279297


                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 21.13it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.87it/s][A

nll mean: 111.67142486572266 	 kl mean: 9.185742378234863 	 loss mean: 120.857177734375
nll mean: 83.74434661865234 	 kl mean: 10.75776481628418 	 loss mean: 94.50212097167969
nll mean: 83.92791748046875 	 kl mean: 10.75776481628418 	 loss mean: 94.68568420410156
nll mean: 83.40679168701172 	 kl mean: 10.75776481628418 	 loss mean: 94.16455078125
nll mean: 83.74186706542969 	 kl mean: 10.75776481628418 	 loss mean: 94.49962615966797
nll mean: 83.66938781738281 	 kl mean: 10.75776481628418 	 loss mean: 94.4271469116211
nll mean: 83.46317291259766 	 kl mean: 10.75776481628418 	 loss mean: 94.22093963623047


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.87it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
100%|██████████| 10/10 [00:00<00:00, 30.31it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.55it/s]


nll mean: 83.64277648925781 	 kl mean: 10.75776481628418 	 loss mean: 94.4005355834961
nll mean: 83.75682067871094 	 kl mean: 10.75776481628418 	 loss mean: 94.51458740234375
nll mean: 83.38176727294922 	 kl mean: 10.75776481628418 	 loss mean: 94.13954162597656
nll mean: 83.12255859375 	 kl mean: 10.75776481628418 	 loss mean: 93.88031005859375
Approximate NLL:
tensor(121.1414, device='cuda:0')
Approximate KL:
tensor(9.4737, device='cuda:0')
Testing took 0:00:25.560028


  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
                                      [A
  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      .75it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .75it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.75it/s][A

nll mean: 108.59734344482422 	 kl mean: 10.26249885559082 	 loss mean: 118.85984802246094
nll mean: 107.63687133789062 	 kl mean: 10.26249885559082 	 loss mean: 117.89936828613281
nll mean: 107.17649841308594 	 kl mean: 10.26249885559082 	 loss mean: 117.43899536132812
nll mean: 107.42503356933594 	 kl mean: 10.26249885559082 	 loss mean: 117.68753814697266
nll mean: 107.84661865234375 	 kl mean: 10.26249885559082 	 loss mean: 118.109130859375


                                      
  0%|          | 0/38 [00:00<?, ?it/s]        
 30%|███       | 3/10 [00:00<00:00, 25.75it/s][A
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
                                      .40it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
 60%|██████    | 6/10 [00:00<00:00, 25.40it/s][A
                                      .04it/s][A
  0%|          | 0/38 [00:00<?, ?it/s]        
100%|██████████| 10/10 [00:00<00:00, 24.81it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.60018157958984 	 kl mean: 10.26249885559082 	 loss mean: 118.86268615722656
nll mean: 107.52777099609375 	 kl mean: 10.26249885559082 	 loss mean: 117.79027557373047
nll mean: 107.74710845947266 	 kl mean: 10.26249885559082 	 loss mean: 118.00961303710938
nll mean: 108.02828979492188 	 kl mean: 10.26249885559082 	 loss mean: 118.29078674316406
nll mean: 108.00328063964844 	 kl mean: 10.26249885559082 	 loss mean: 118.26579284667969


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.64it/s][A

nll mean: 125.260498046875 	 kl mean: 9.99409294128418 	 loss mean: 135.2545928955078
nll mean: 125.27815246582031 	 kl mean: 9.99409294128418 	 loss mean: 135.27224731445312
nll mean: 125.91297149658203 	 kl mean: 9.99409294128418 	 loss mean: 135.90707397460938


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 20%|██        | 2/10 [00:00<00:00, 13.64it/s][A
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 40%|████      | 4/10 [00:00<00:00, 13.81it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.05it/s][A

nll mean: 125.37260437011719 	 kl mean: 9.99409294128418 	 loss mean: 135.36669921875
nll mean: 125.64285278320312 	 kl mean: 9.99409294128418 	 loss mean: 135.63694763183594
nll mean: 125.63323974609375 	 kl mean: 9.99409294128418 	 loss mean: 135.62733459472656


                                              
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
                                              [A
  3%|▎         | 1/38 [00:00<00:14,  2.47it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.05it/s][A
                                              [A
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.00it/s][A

nll mean: 124.96788024902344 	 kl mean: 9.99409294128418 	 loss mean: 134.96197509765625
nll mean: 125.22271728515625 	 kl mean: 9.99409294128418 	 loss mean: 135.21681213378906
nll mean: 125.33334350585938 	 kl mean: 9.99409294128418 	 loss mean: 135.3274383544922


                                              
  3%|▎         | 1/38 [00:01<00:14,  2.47it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.00it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.03it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.29it/s][A

nll mean: 125.59678649902344 	 kl mean: 9.99409294128418 	 loss mean: 135.59088134765625
nll mean: 96.85453796386719 	 kl mean: 9.157861709594727 	 loss mean: 106.01239013671875
nll mean: 96.83979797363281 	 kl mean: 9.157861709594727 	 loss mean: 105.9976577758789
nll mean: 97.0516128540039 	 kl mean: 9.157861709594727 	 loss mean: 106.20947265625
nll mean: 97.23094177246094 	 kl mean: 9.157861709594727 	 loss mean: 106.38880920410156


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.29it/s][A
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              [A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.17it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.10it/s][A

nll mean: 97.17288208007812 	 kl mean: 9.157861709594727 	 loss mean: 106.33074188232422
nll mean: 97.2297592163086 	 kl mean: 9.157861709594727 	 loss mean: 106.38761901855469
nll mean: 97.37448120117188 	 kl mean: 9.157861709594727 	 loss mean: 106.5323486328125
nll mean: 97.40843200683594 	 kl mean: 9.157861709594727 	 loss mean: 106.56629943847656
nll mean: 96.9385986328125 	 kl mean: 9.157861709594727 	 loss mean: 106.09646606445312


                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
100%|██████████| 10/10 [00:00<00:00, 24.09it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.67it/s][A

nll mean: 97.03240966796875 	 kl mean: 9.157861709594727 	 loss mean: 106.19027709960938
nll mean: 136.95077514648438 	 kl mean: 9.963366508483887 	 loss mean: 146.91415405273438
nll mean: 137.8639678955078 	 kl mean: 9.963366508483887 	 loss mean: 147.82733154296875


                                              
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
                                              [A
  8%|▊         | 3/38 [00:01<00:16,  2.11it/s]
 20%|██        | 2/10 [00:00<00:00, 10.67it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
 40%|████      | 4/10 [00:00<00:00, 10.71it/s][A

nll mean: 137.73263549804688 	 kl mean: 9.963366508483887 	 loss mean: 147.6959991455078
nll mean: 137.66981506347656 	 kl mean: 9.963366508483887 	 loss mean: 147.6331787109375
nll mean: 137.83114624023438 	 kl mean: 9.963366508483887 	 loss mean: 147.79452514648438


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
 40%|████      | 4/10 [00:00<00:00, 10.71it/s][A
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.75it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.74it/s][A

nll mean: 138.06854248046875 	 kl mean: 9.963366508483887 	 loss mean: 148.03189086914062
nll mean: 137.49432373046875 	 kl mean: 9.963366508483887 	 loss mean: 147.45770263671875
nll mean: 137.76577758789062 	 kl mean: 9.963366508483887 	 loss mean: 147.72914123535156


                                              
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
                                              [A
  8%|▊         | 3/38 [00:02<00:16,  2.11it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.74it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.77it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 137.62020874023438 	 kl mean: 9.963366508483887 	 loss mean: 147.5835723876953
nll mean: 138.07086181640625 	 kl mean: 9.963366508483887 	 loss mean: 148.03421020507812
nll mean: 125.6245346069336 	 kl mean: 9.474397659301758 	 loss mean: 135.09893798828125


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.11it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.01it/s][A

nll mean: 125.36844635009766 	 kl mean: 9.474397659301758 	 loss mean: 134.84283447265625
nll mean: 125.42750549316406 	 kl mean: 9.474397659301758 	 loss mean: 134.90191650390625
nll mean: 125.72884368896484 	 kl mean: 9.474397659301758 	 loss mean: 135.2032470703125


                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 40%|████      | 4/10 [00:00<00:00, 14.01it/s][A
                                              [A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.99it/s][A

nll mean: 125.3004379272461 	 kl mean: 9.474397659301758 	 loss mean: 134.77484130859375
nll mean: 125.27727508544922 	 kl mean: 9.474397659301758 	 loss mean: 134.75167846679688
nll mean: 126.04708099365234 	 kl mean: 9.474397659301758 	 loss mean: 135.521484375


                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 60%|██████    | 6/10 [00:00<00:00, 13.99it/s][A
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
                                              [A
 11%|█         | 4/38 [00:03<00:20,  1.64it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.03it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.03it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 125.24089050292969 	 kl mean: 9.474397659301758 	 loss mean: 134.71530151367188
nll mean: 125.12242126464844 	 kl mean: 9.474397659301758 	 loss mean: 134.59683227539062
nll mean: 125.56185913085938 	 kl mean: 9.474397659301758 	 loss mean: 135.0362548828125


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.24it/s][A

nll mean: 123.05917358398438 	 kl mean: 9.339832305908203 	 loss mean: 132.3990020751953
nll mean: 122.16311645507812 	 kl mean: 9.339832305908203 	 loss mean: 131.50296020507812
nll mean: 122.0488510131836 	 kl mean: 9.339832305908203 	 loss mean: 131.388671875


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.24it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 40%|████      | 4/10 [00:00<00:00, 14.23it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.15it/s][A

nll mean: 122.12557983398438 	 kl mean: 9.339832305908203 	 loss mean: 131.4654083251953
nll mean: 122.29531860351562 	 kl mean: 9.339832305908203 	 loss mean: 131.63516235351562
nll mean: 122.3506851196289 	 kl mean: 9.339832305908203 	 loss mean: 131.69052124023438


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.15it/s][A
                                              [A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.08it/s][A

nll mean: 122.12258911132812 	 kl mean: 9.339832305908203 	 loss mean: 131.46241760253906
nll mean: 122.4666519165039 	 kl mean: 9.339832305908203 	 loss mean: 131.80648803710938
nll mean: 122.29359436035156 	 kl mean: 9.339832305908203 	 loss mean: 131.6334228515625


                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.08it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.08it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.44it/s][A

nll mean: 121.94202423095703 	 kl mean: 9.339832305908203 	 loss mean: 131.2818603515625
nll mean: 132.79815673828125 	 kl mean: 9.359054565429688 	 loss mean: 142.15719604492188
nll mean: 132.58200073242188 	 kl mean: 9.359054565429688 	 loss mean: 141.94107055664062
nll mean: 133.20074462890625 	 kl mean: 9.359054565429688 	 loss mean: 142.55979919433594
nll mean: 133.24032592773438 	 kl mean: 9.359054565429688 	 loss mean: 142.59938049316406


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.44it/s][A
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
                                              [A
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.23it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.05it/s][A

nll mean: 133.11293029785156 	 kl mean: 9.359054565429688 	 loss mean: 142.47198486328125
nll mean: 132.86209106445312 	 kl mean: 9.359054565429688 	 loss mean: 142.2211456298828
nll mean: 133.01852416992188 	 kl mean: 9.359054565429688 	 loss mean: 142.3775634765625
nll mean: 132.83004760742188 	 kl mean: 9.359054565429688 	 loss mean: 142.18910217285156
nll mean: 132.7796630859375 	 kl mean: 9.359054565429688 	 loss mean: 142.13870239257812


                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 24.87it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.01it/s][A

nll mean: 133.2338104248047 	 kl mean: 9.359054565429688 	 loss mean: 142.59286499023438
nll mean: 105.66166687011719 	 kl mean: 9.542561531066895 	 loss mean: 115.20423126220703
nll mean: 105.53007507324219 	 kl mean: 9.542561531066895 	 loss mean: 115.07262420654297
nll mean: 104.9939193725586 	 kl mean: 9.542561531066895 	 loss mean: 114.53648376464844
nll mean: 105.34934997558594 	 kl mean: 9.542561531066895 	 loss mean: 114.89192199707031


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 25.01it/s][A
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              [A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.79it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.50it/s][A

nll mean: 105.3858642578125 	 kl mean: 9.542561531066895 	 loss mean: 114.92842102050781
nll mean: 105.52780151367188 	 kl mean: 9.542561531066895 	 loss mean: 115.07035827636719
nll mean: 105.31122589111328 	 kl mean: 9.542561531066895 	 loss mean: 114.8537826538086
nll mean: 105.74051666259766 	 kl mean: 9.542561531066895 	 loss mean: 115.2830810546875
nll mean: 105.01286315917969 	 kl mean: 9.542561531066895 	 loss mean: 114.555419921875


                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
100%|██████████| 10/10 [00:00<00:00, 24.37it/s][A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.27it/s][A

nll mean: 105.31448364257812 	 kl mean: 9.542561531066895 	 loss mean: 114.85704040527344
nll mean: 129.58975219726562 	 kl mean: 10.294837951660156 	 loss mean: 139.88458251953125
nll mean: 130.00686645507812 	 kl mean: 10.294837951660156 	 loss mean: 140.30169677734375


                                              
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:04<00:16,  1.87it/s]
 20%|██        | 2/10 [00:00<00:00, 14.27it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 40%|████      | 4/10 [00:00<00:00, 14.43it/s][A

nll mean: 129.998046875 	 kl mean: 10.294837951660156 	 loss mean: 140.2928924560547
nll mean: 129.57778930664062 	 kl mean: 10.294837951660156 	 loss mean: 139.8726348876953
nll mean: 129.75289916992188 	 kl mean: 10.294837951660156 	 loss mean: 140.0477294921875
nll mean: 129.9131317138672 	 kl mean: 10.294837951660156 	 loss mean: 140.2079620361328



                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.60it/s][A
                                              [A
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.34it/s][A

nll mean: 129.75767517089844 	 kl mean: 10.294837951660156 	 loss mean: 140.05252075195312
nll mean: 130.04568481445312 	 kl mean: 10.294837951660156 	 loss mean: 140.3405303955078
nll mean: 129.25230407714844 	 kl mean: 10.294837951660156 	 loss mean: 139.54714965820312


                                              
 21%|██        | 8/38 [00:05<00:16,  1.87it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.34it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.47it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 21.63it/s][A

nll mean: 129.8085479736328 	 kl mean: 10.294837951660156 	 loss mean: 140.10337829589844
nll mean: 129.65866088867188 	 kl mean: 9.922172546386719 	 loss mean: 139.58082580566406
nll mean: 129.54437255859375 	 kl mean: 9.922172546386719 	 loss mean: 139.46653747558594
nll mean: 129.87049865722656 	 kl mean: 9.922172546386719 	 loss mean: 139.79266357421875
nll mean: 129.5917205810547 	 kl mean: 9.922172546386719 	 loss mean: 139.51388549804688


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 21.63it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
 50%|█████     | 5/10 [00:00<00:00, 21.06it/s][A
                                              [A
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
 80%|████████  | 8/10 [00:00<00:00, 21.03it/s][A

nll mean: 129.92897033691406 	 kl mean: 9.922172546386719 	 loss mean: 139.85113525390625
nll mean: 129.5149383544922 	 kl mean: 9.922172546386719 	 loss mean: 139.43710327148438
nll mean: 129.19073486328125 	 kl mean: 9.922172546386719 	 loss mean: 139.11289978027344
nll mean: 129.25442504882812 	 kl mean: 9.922172546386719 	 loss mean: 139.1765899658203
nll mean: 129.92611694335938 	 kl mean: 9.922172546386719 	 loss mean: 139.84829711914062


                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 20.96it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.81it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.81it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.81it/s]
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
 30%|███       | 3/10 [00:00<00:00, 24.93it/s][A

nll mean: 129.55120849609375 	 kl mean: 9.922172546386719 	 loss mean: 139.473388671875
nll mean: 117.36518859863281 	 kl mean: 10.122591972351074 	 loss mean: 127.48777770996094
nll mean: 118.16952514648438 	 kl mean: 10.122591972351074 	 loss mean: 128.2921142578125
nll mean: 118.22152709960938 	 kl mean: 10.122591972351074 	 loss mean: 128.3441162109375
nll mean: 118.39393615722656 	 kl mean: 10.122591972351074 	 loss mean: 128.51654052734375


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
 30%|███       | 3/10 [00:00<00:00, 24.93it/s][A
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
                                               [A
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.78it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.69it/s][A

nll mean: 118.30818176269531 	 kl mean: 10.122591972351074 	 loss mean: 128.43077087402344
nll mean: 117.88810729980469 	 kl mean: 10.122591972351074 	 loss mean: 128.01071166992188
nll mean: 117.48583984375 	 kl mean: 10.122591972351074 	 loss mean: 127.60844421386719
nll mean: 117.99601745605469 	 kl mean: 10.122591972351074 	 loss mean: 128.1186065673828
nll mean: 118.04945373535156 	 kl mean: 10.122591972351074 	 loss mean: 128.17205810546875


                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.81it/s]
100%|██████████| 10/10 [00:00<00:00, 24.53it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 30%|███       | 3/10 [00:00<00:00, 21.15it/s][A

nll mean: 118.41986083984375 	 kl mean: 10.122591972351074 	 loss mean: 128.54244995117188
nll mean: 140.00045776367188 	 kl mean: 10.022830963134766 	 loss mean: 150.02328491210938
nll mean: 140.51339721679688 	 kl mean: 10.022830963134766 	 loss mean: 150.53622436523438
nll mean: 139.9087371826172 	 kl mean: 10.022830963134766 	 loss mean: 149.9315643310547
nll mean: 140.78952026367188 	 kl mean: 10.022830963134766 	 loss mean: 150.81234741210938


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 30%|███       | 3/10 [00:00<00:00, 21.15it/s][A
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               [A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.09it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.05it/s][A

nll mean: 140.42257690429688 	 kl mean: 10.022830963134766 	 loss mean: 150.44540405273438
nll mean: 140.7210693359375 	 kl mean: 10.022830963134766 	 loss mean: 150.743896484375
nll mean: 140.6043701171875 	 kl mean: 10.022830963134766 	 loss mean: 150.62721252441406
nll mean: 140.62893676757812 	 kl mean: 10.022830963134766 	 loss mean: 150.65176391601562
nll mean: 140.93638610839844 	 kl mean: 10.022830963134766 	 loss mean: 150.95921325683594


                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
100%|██████████| 10/10 [00:00<00:00, 20.85it/s][A
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]
                                               
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A

nll mean: 140.10272216796875 	 kl mean: 10.022830963134766 	 loss mean: 150.12554931640625
nll mean: 119.31732177734375 	 kl mean: 10.424245834350586 	 loss mean: 129.7415771484375
nll mean: 118.73564147949219 	 kl mean: 10.424245834350586 	 loss mean: 129.15989685058594


                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A

nll mean: 119.31517028808594 	 kl mean: 10.424245834350586 	 loss mean: 129.73941040039062
nll mean: 118.66397094726562 	 kl mean: 10.424245834350586 	 loss mean: 129.08822631835938
nll mean: 119.361572265625 	 kl mean: 10.424245834350586 	 loss mean: 129.78582763671875


                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
 40%|████      | 4/10 [00:00<00:00, 12.50it/s][A
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.57it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.48it/s][A

nll mean: 119.14991760253906 	 kl mean: 10.424245834350586 	 loss mean: 129.57415771484375
nll mean: 118.87203979492188 	 kl mean: 10.424245834350586 	 loss mean: 129.29627990722656
nll mean: 119.12539672851562 	 kl mean: 10.424245834350586 	 loss mean: 129.54965209960938


                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
                                               [A
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.48it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.46it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.69it/s]
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.69it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.86358642578125 	 kl mean: 10.424245834350586 	 loss mean: 129.28782653808594
nll mean: 119.43290710449219 	 kl mean: 10.424245834350586 	 loss mean: 129.85714721679688
nll mean: 161.62249755859375 	 kl mean: 10.76314926147461 	 loss mean: 172.38563537597656


                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.69it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 34%|███▍      | 13/38 [00:07<00:14,  1.69it/s]
 20%|██        | 2/10 [00:00<00:00,  9.96it/s][A
                                               [A

nll mean: 161.61453247070312 	 kl mean: 10.76314926147461 	 loss mean: 172.37770080566406
nll mean: 161.7539825439453 	 kl mean: 10.76314926147461 	 loss mean: 172.5171356201172



 34%|███▍      | 13/38 [00:07<00:14,  1.69it/s]
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 40%|████      | 4/10 [00:00<00:00,  9.93it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.91it/s][A

nll mean: 161.64219665527344 	 kl mean: 10.76314926147461 	 loss mean: 172.40533447265625
nll mean: 160.89852905273438 	 kl mean: 10.76314926147461 	 loss mean: 171.66168212890625


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.91it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.88it/s][A
                                               [A


nll mean: 161.49166870117188 	 kl mean: 10.76314926147461 	 loss mean: 172.25482177734375
nll mean: 161.35345458984375 	 kl mean: 10.76314926147461 	 loss mean: 172.1165771484375


 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 70%|███████   | 7/10 [00:00<00:00,  9.89it/s][A
                                               [A
 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 80%|████████  | 8/10 [00:00<00:00,  9.90it/s][A
                                               [A


nll mean: 161.18199157714844 	 kl mean: 10.76314926147461 	 loss mean: 171.94515991210938
nll mean: 161.5904998779297 	 kl mean: 10.76314926147461 	 loss mean: 172.35365295410156


 34%|███▍      | 13/38 [00:08<00:14,  1.69it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.91it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 18.25it/s][A

nll mean: 161.35733032226562 	 kl mean: 10.76314926147461 	 loss mean: 172.1204833984375
nll mean: 134.82864379882812 	 kl mean: 9.357975006103516 	 loss mean: 144.18663024902344
nll mean: 134.9038543701172 	 kl mean: 9.357975006103516 	 loss mean: 144.26182556152344
nll mean: 134.22119140625 	 kl mean: 9.357975006103516 	 loss mean: 143.57916259765625


                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 18.25it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
 40%|████      | 4/10 [00:00<00:00, 18.03it/s][A
                                               [A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.83it/s][A

nll mean: 135.0281524658203 	 kl mean: 9.357975006103516 	 loss mean: 144.3861083984375
nll mean: 134.46337890625 	 kl mean: 9.357975006103516 	 loss mean: 143.82135009765625
nll mean: 134.84820556640625 	 kl mean: 9.357975006103516 	 loss mean: 144.2061767578125
nll mean: 134.6710205078125 	 kl mean: 9.357975006103516 	 loss mean: 144.02899169921875


                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s]
 60%|██████    | 6/10 [00:00<00:00, 17.83it/s][A
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s]
                                               [A
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s]
 80%|████████  | 8/10 [00:00<00:00, 17.76it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.60it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 134.33407592773438 	 kl mean: 9.357975006103516 	 loss mean: 143.69204711914062
nll mean: 134.6343536376953 	 kl mean: 9.357975006103516 	 loss mean: 143.99234008789062
nll mean: 134.9761505126953 	 kl mean: 9.357975006103516 	 loss mean: 144.33412170410156


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.64it/s][A

nll mean: 142.2894744873047 	 kl mean: 10.436187744140625 	 loss mean: 152.72567749023438
nll mean: 142.2716827392578 	 kl mean: 10.436187744140625 	 loss mean: 152.70787048339844
nll mean: 142.13546752929688 	 kl mean: 10.436187744140625 	 loss mean: 152.5716552734375


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 20%|██        | 2/10 [00:00<00:00, 10.64it/s][A
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 10.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.66it/s][A

nll mean: 142.75494384765625 	 kl mean: 10.436187744140625 	 loss mean: 153.19113159179688
nll mean: 142.0318145751953 	 kl mean: 10.436187744140625 	 loss mean: 152.46800231933594
nll mean: 142.5040740966797 	 kl mean: 10.436187744140625 	 loss mean: 152.9402618408203


                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
                                               [A
 39%|███▉      | 15/38 [00:09<00:15,  1.48it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.66it/s][A
                                               [A
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A

nll mean: 142.52578735351562 	 kl mean: 10.436187744140625 	 loss mean: 152.96197509765625
nll mean: 142.4493408203125 	 kl mean: 10.436187744140625 	 loss mean: 152.88551330566406
nll mean: 142.6036376953125 	 kl mean: 10.436187744140625 	 loss mean: 153.03981018066406


                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.48it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 24.94it/s][A

nll mean: 142.7071533203125 	 kl mean: 10.436187744140625 	 loss mean: 153.14334106445312
nll mean: 144.90048217773438 	 kl mean: 9.236011505126953 	 loss mean: 154.13648986816406
nll mean: 145.20797729492188 	 kl mean: 9.236011505126953 	 loss mean: 154.44400024414062
nll mean: 144.6891326904297 	 kl mean: 9.236011505126953 	 loss mean: 153.92514038085938
nll mean: 145.08001708984375 	 kl mean: 9.236011505126953 	 loss mean: 154.3160400390625


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 30%|███       | 3/10 [00:00<00:00, 24.94it/s][A
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
                                               [A
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.70it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.56it/s][A

nll mean: 145.00108337402344 	 kl mean: 9.236011505126953 	 loss mean: 154.23709106445312
nll mean: 144.88551330566406 	 kl mean: 9.236011505126953 	 loss mean: 154.12152099609375
nll mean: 145.26780700683594 	 kl mean: 9.236011505126953 	 loss mean: 154.50381469726562
nll mean: 145.12701416015625 	 kl mean: 9.236011505126953 	 loss mean: 154.36300659179688
nll mean: 144.39932250976562 	 kl mean: 9.236011505126953 	 loss mean: 153.6353302001953


                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.32it/s]
100%|██████████| 10/10 [00:00<00:00, 24.34it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 24.64it/s][A

nll mean: 145.20855712890625 	 kl mean: 9.236011505126953 	 loss mean: 154.44456481933594
nll mean: 132.238037109375 	 kl mean: 10.054498672485352 	 loss mean: 142.29254150390625
nll mean: 132.61973571777344 	 kl mean: 10.054498672485352 	 loss mean: 142.6742401123047
nll mean: 132.58489990234375 	 kl mean: 10.054498672485352 	 loss mean: 142.639404296875
nll mean: 133.0801239013672 	 kl mean: 10.054498672485352 	 loss mean: 143.13462829589844


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 30%|███       | 3/10 [00:00<00:00, 24.64it/s][A
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
                                               [A
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 24.61it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.48it/s][A

nll mean: 132.39332580566406 	 kl mean: 10.054498672485352 	 loss mean: 142.44781494140625
nll mean: 132.2082061767578 	 kl mean: 10.054498672485352 	 loss mean: 142.26271057128906
nll mean: 132.03829956054688 	 kl mean: 10.054498672485352 	 loss mean: 142.09278869628906
nll mean: 132.63796997070312 	 kl mean: 10.054498672485352 	 loss mean: 142.6924591064453
nll mean: 132.83694458007812 	 kl mean: 10.054498672485352 	 loss mean: 142.89144897460938


                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.53it/s]
100%|██████████| 10/10 [00:00<00:00, 24.47it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.72it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 12.74it/s][A

nll mean: 132.64476013183594 	 kl mean: 10.054498672485352 	 loss mean: 142.6992645263672
nll mean: 127.95130157470703 	 kl mean: 10.387222290039062 	 loss mean: 138.33853149414062
nll mean: 128.41722106933594 	 kl mean: 10.387222290039062 	 loss mean: 138.804443359375


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 20%|██        | 2/10 [00:00<00:00, 12.74it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A

nll mean: 128.3940887451172 	 kl mean: 10.387222290039062 	 loss mean: 138.78131103515625
nll mean: 128.40615844726562 	 kl mean: 10.387222290039062 	 loss mean: 138.7933807373047
nll mean: 128.75637817382812 	 kl mean: 10.387222290039062 	 loss mean: 139.14358520507812


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 40%|████      | 4/10 [00:00<00:00, 12.60it/s][A
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A

nll mean: 128.3609619140625 	 kl mean: 10.387222290039062 	 loss mean: 138.7481689453125
nll mean: 129.10064697265625 	 kl mean: 10.387222290039062 	 loss mean: 139.48785400390625
nll mean: 128.31756591796875 	 kl mean: 10.387222290039062 	 loss mean: 138.7047882080078


                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
                                               [A
 47%|████▋     | 18/38 [00:11<00:11,  1.72it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.39it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 128.00323486328125 	 kl mean: 10.387222290039062 	 loss mean: 138.39044189453125
nll mean: 128.2425537109375 	 kl mean: 10.387222290039062 	 loss mean: 138.6297607421875
nll mean: 147.4688262939453 	 kl mean: 10.284673690795898 	 loss mean: 157.75350952148438


                                               
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 50%|█████     | 19/38 [00:11<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 20%|██        | 2/10 [00:00<00:00, 12.52it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A

nll mean: 147.18096923828125 	 kl mean: 10.284673690795898 	 loss mean: 157.46563720703125
nll mean: 147.25228881835938 	 kl mean: 10.284673690795898 	 loss mean: 157.53695678710938
nll mean: 147.54098510742188 	 kl mean: 10.284673690795898 	 loss mean: 157.82566833496094


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A

nll mean: 147.009765625 	 kl mean: 10.284673690795898 	 loss mean: 157.29444885253906
nll mean: 147.50625610351562 	 kl mean: 10.284673690795898 	 loss mean: 157.79092407226562
nll mean: 146.94107055664062 	 kl mean: 10.284673690795898 	 loss mean: 157.22573852539062


                                               
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.47it/s][A
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
                                               [A
 50%|█████     | 19/38 [00:12<00:12,  1.54it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.47it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.41it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 147.59066772460938 	 kl mean: 10.284673690795898 	 loss mean: 157.87533569335938
nll mean: 147.22972106933594 	 kl mean: 10.284673690795898 	 loss mean: 157.514404296875
nll mean: 146.9060516357422 	 kl mean: 10.284673690795898 	 loss mean: 157.1907196044922


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A

nll mean: 156.51766967773438 	 kl mean: 9.653374671936035 	 loss mean: 166.17105102539062
nll mean: 157.43304443359375 	 kl mean: 9.653374671936035 	 loss mean: 167.08641052246094
nll mean: 156.5433349609375 	 kl mean: 9.653374671936035 	 loss mean: 166.19668579101562


                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.43it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 40%|████      | 4/10 [00:00<00:00, 12.43it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.42it/s][A

nll mean: 155.86904907226562 	 kl mean: 9.653374671936035 	 loss mean: 165.52239990234375
nll mean: 156.32760620117188 	 kl mean: 9.653374671936035 	 loss mean: 165.98098754882812
nll mean: 156.39219665527344 	 kl mean: 9.653374671936035 	 loss mean: 166.04556274414062


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.42it/s][A
                                               [A
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A

nll mean: 156.75643920898438 	 kl mean: 9.653374671936035 	 loss mean: 166.40982055664062
nll mean: 156.3125457763672 	 kl mean: 9.653374671936035 	 loss mean: 165.96592712402344
nll mean: 156.99423217773438 	 kl mean: 9.653374671936035 	 loss mean: 166.6475830078125


                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.43it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]

nll mean: 156.5143280029297 	 kl mean: 9.653374671936035 	 loss mean: 166.16769409179688
nll mean: 116.53567504882812 	 kl mean: 10.0143461227417 	 loss mean: 126.55001831054688
nll mean: 116.79345703125 	 kl mean: 10.0143461227417 	 loss mean: 126.80780792236328



  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 10.17it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 10.22it/s][A

nll mean: 116.26704406738281 	 kl mean: 10.0143461227417 	 loss mean: 126.28138732910156
nll mean: 116.53593444824219 	 kl mean: 10.0143461227417 	 loss mean: 126.55027770996094
nll mean: 115.7734375 	 kl mean: 10.0143461227417 	 loss mean: 125.78778076171875


                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 40%|████      | 4/10 [00:00<00:00, 10.22it/s][A
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.29it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.26it/s][A

nll mean: 116.76980590820312 	 kl mean: 10.0143461227417 	 loss mean: 126.78414154052734
nll mean: 116.2432632446289 	 kl mean: 10.0143461227417 	 loss mean: 126.25760650634766
nll mean: 116.53446197509766 	 kl mean: 10.0143461227417 	 loss mean: 126.54881286621094


                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
                                               [A
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.26it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.27it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 116.60950469970703 	 kl mean: 10.0143461227417 	 loss mean: 126.62384033203125
nll mean: 116.47758483886719 	 kl mean: 10.0143461227417 	 loss mean: 126.49192810058594
nll mean: 105.48958587646484 	 kl mean: 8.745176315307617 	 loss mean: 114.23475646972656
nll mean: 105.54283905029297 	 kl mean: 8.745176315307617 	 loss mean: 114.28800964355469
nll mean: 105.70167541503906 	 kl mean: 8.745176315307617 	 loss mean: 114.44685363769531


                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 32.76it/s][A
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               [A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
100%|██████████| 10/10 [00:00<00:00, 32.58it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 105.04623413085938 	 kl mean: 8.745176315307617 	 loss mean: 113.79141235351562
nll mean: 105.01060485839844 	 kl mean: 8.745176315307617 	 loss mean: 113.75578308105469
nll mean: 104.73379516601562 	 kl mean: 8.745176315307617 	 loss mean: 113.47896575927734
nll mean: 105.0830078125 	 kl mean: 8.745176315307617 	 loss mean: 113.82818603515625
nll mean: 105.36543273925781 	 kl mean: 8.745176315307617 	 loss mean: 114.11061096191406
nll mean: 105.10829162597656 	 kl mean: 8.745176315307617 	 loss mean: 113.85346984863281
nll mean: 105.32307434082031 	 kl mean: 8.745176315307617 	 loss mean: 114.06825256347656


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.62it/s][A

nll mean: 158.45880126953125 	 kl mean: 9.503730773925781 	 loss mean: 167.9625244140625
nll mean: 158.05906677246094 	 kl mean: 9.503730773925781 	 loss mean: 167.56280517578125
nll mean: 158.42532348632812 	 kl mean: 9.503730773925781 	 loss mean: 167.92904663085938


                                               
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
 20%|██        | 2/10 [00:00<00:00, 14.62it/s][A
                                               [A
 61%|██████    | 23/38 [00:14<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 40%|████      | 4/10 [00:00<00:00, 14.68it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.68it/s][A

nll mean: 158.15322875976562 	 kl mean: 9.503730773925781 	 loss mean: 167.65695190429688
nll mean: 158.16094970703125 	 kl mean: 9.503730773925781 	 loss mean: 167.6646728515625
nll mean: 158.2859649658203 	 kl mean: 9.503730773925781 	 loss mean: 167.78968811035156


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.68it/s][A
                                               [A
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.66it/s][A

nll mean: 158.2215576171875 	 kl mean: 9.503730773925781 	 loss mean: 167.7252960205078
nll mean: 158.2193145751953 	 kl mean: 9.503730773925781 	 loss mean: 167.72305297851562
nll mean: 158.51925659179688 	 kl mean: 9.503730773925781 	 loss mean: 168.02297973632812


                                               
 61%|██████    | 23/38 [00:15<00:09,  1.53it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.66it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.65it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.95it/s][A

nll mean: 158.46749877929688 	 kl mean: 9.503730773925781 	 loss mean: 167.97122192382812
nll mean: 119.06278991699219 	 kl mean: 10.406803131103516 	 loss mean: 129.46958923339844
nll mean: 118.55117797851562 	 kl mean: 10.406803131103516 	 loss mean: 128.95799255371094
nll mean: 118.40286254882812 	 kl mean: 10.406803131103516 	 loss mean: 128.80966186523438
nll mean: 119.03428649902344 	 kl mean: 10.406803131103516 	 loss mean: 129.44110107421875


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 21.95it/s][A
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
                                               [A
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.78it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.50it/s][A

nll mean: 118.84015655517578 	 kl mean: 10.406803131103516 	 loss mean: 129.2469482421875
nll mean: 118.82005310058594 	 kl mean: 10.406803131103516 	 loss mean: 129.2268524169922
nll mean: 119.18983459472656 	 kl mean: 10.406803131103516 	 loss mean: 129.59664916992188
nll mean: 119.03422546386719 	 kl mean: 10.406803131103516 	 loss mean: 129.4410400390625
nll mean: 118.70697021484375 	 kl mean: 10.406803131103516 	 loss mean: 129.11376953125


                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.51it/s]
100%|██████████| 10/10 [00:00<00:00, 21.28it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 14.44it/s][A

nll mean: 118.51406860351562 	 kl mean: 10.406803131103516 	 loss mean: 128.92086791992188
nll mean: 111.72766876220703 	 kl mean: 9.80971908569336 	 loss mean: 121.53738403320312
nll mean: 111.27714538574219 	 kl mean: 9.80971908569336 	 loss mean: 121.08685302734375


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.44it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.51it/s][A

nll mean: 111.96855163574219 	 kl mean: 9.80971908569336 	 loss mean: 121.77827453613281
nll mean: 111.9546127319336 	 kl mean: 9.80971908569336 	 loss mean: 121.76432800292969
nll mean: 111.82817840576172 	 kl mean: 9.80971908569336 	 loss mean: 121.63789367675781


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 40%|████      | 4/10 [00:00<00:00, 14.51it/s][A
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 60%|██████    | 6/10 [00:00<00:00, 14.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.63it/s][A

nll mean: 111.77947998046875 	 kl mean: 9.80971908569336 	 loss mean: 121.58918762207031
nll mean: 112.25155639648438 	 kl mean: 9.80971908569336 	 loss mean: 122.06127166748047
nll mean: 111.76959228515625 	 kl mean: 9.80971908569336 	 loss mean: 121.57931518554688


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
                                               [A
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s]
 80%|████████  | 8/10 [00:00<00:00, 14.63it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.63it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 112.40401458740234 	 kl mean: 9.80971908569336 	 loss mean: 122.21373748779297
nll mean: 111.43470764160156 	 kl mean: 9.80971908569336 	 loss mean: 121.24443054199219
nll mean: 81.650634765625 	 kl mean: 8.625319480895996 	 loss mean: 90.27595520019531
nll mean: 82.0064697265625 	 kl mean: 8.625319480895996 	 loss mean: 90.63178253173828


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 22.35it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.20it/s][A

nll mean: 82.15177917480469 	 kl mean: 8.625319480895996 	 loss mean: 90.77710723876953
nll mean: 82.34062194824219 	 kl mean: 8.625319480895996 	 loss mean: 90.9659423828125
nll mean: 82.11868286132812 	 kl mean: 8.625319480895996 	 loss mean: 90.74400329589844
nll mean: 81.33927154541016 	 kl mean: 8.625319480895996 	 loss mean: 89.96459197998047
nll mean: 81.48960876464844 	 kl mean: 8.625319480895996 	 loss mean: 90.11492919921875


                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 60%|██████    | 6/10 [00:00<00:00, 22.20it/s][A
                                               [A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
100%|██████████| 10/10 [00:00<00:00, 21.64it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.72it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 81.75163269042969 	 kl mean: 8.625319480895996 	 loss mean: 90.376953125
nll mean: 81.87313842773438 	 kl mean: 8.625319480895996 	 loss mean: 90.49845123291016
nll mean: 82.32743835449219 	 kl mean: 8.625319480895996 	 loss mean: 90.9527587890625
nll mean: 109.22825622558594 	 kl mean: 8.647315979003906 	 loss mean: 117.87556457519531
nll mean: 109.0152587890625 	 kl mean: 8.647315979003906 	 loss mean: 117.66258239746094


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 30%|███       | 3/10 [00:00<00:00, 21.50it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.54it/s][A

nll mean: 109.11457061767578 	 kl mean: 8.647315979003906 	 loss mean: 117.76188659667969
nll mean: 107.95962524414062 	 kl mean: 8.647315979003906 	 loss mean: 116.60693359375
nll mean: 109.10603332519531 	 kl mean: 8.647315979003906 	 loss mean: 117.75334167480469
nll mean: 108.88439178466797 	 kl mean: 8.647315979003906 	 loss mean: 117.53170776367188
nll mean: 108.29696655273438 	 kl mean: 8.647315979003906 	 loss mean: 116.94429016113281


                                               
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.54it/s][A
                                               [A
 71%|███████   | 27/38 [00:17<00:06,  1.72it/s]
100%|██████████| 10/10 [00:00<00:00, 21.53it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 108.91171264648438 	 kl mean: 8.647315979003906 	 loss mean: 117.55902862548828
nll mean: 108.97533416748047 	 kl mean: 8.647315979003906 	 loss mean: 117.62264251708984
nll mean: 108.79629516601562 	 kl mean: 8.647315979003906 	 loss mean: 117.44361877441406
nll mean: 120.37930297851562 	 kl mean: 9.678537368774414 	 loss mean: 130.05783081054688


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 20%|██        | 2/10 [00:00<00:00, 12.53it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A

nll mean: 120.25299072265625 	 kl mean: 9.678537368774414 	 loss mean: 129.93153381347656
nll mean: 120.2568359375 	 kl mean: 9.678537368774414 	 loss mean: 129.93536376953125
nll mean: 120.89722442626953 	 kl mean: 9.678537368774414 	 loss mean: 130.57577514648438


                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 40%|████      | 4/10 [00:00<00:00, 12.51it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A

nll mean: 120.35299682617188 	 kl mean: 9.678537368774414 	 loss mean: 130.0315399169922
nll mean: 120.46553802490234 	 kl mean: 9.678537368774414 	 loss mean: 130.14407348632812
nll mean: 120.05486297607422 	 kl mean: 9.678537368774414 	 loss mean: 129.7333984375


                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.52it/s][A
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s]
                                               [A
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.57it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.56it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 120.58602905273438 	 kl mean: 9.678537368774414 	 loss mean: 130.2645721435547
nll mean: 119.96277618408203 	 kl mean: 9.678537368774414 	 loss mean: 129.6413116455078
nll mean: 120.19300842285156 	 kl mean: 9.678537368774414 	 loss mean: 129.87155151367188


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.08it/s][A

nll mean: 60.2855339050293 	 kl mean: 10.55302619934082 	 loss mean: 70.83855438232422
nll mean: 59.98859405517578 	 kl mean: 10.55302619934082 	 loss mean: 70.5416259765625


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 20%|██        | 2/10 [00:00<00:00, 10.08it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.03it/s][A

nll mean: 59.986541748046875 	 kl mean: 10.55302619934082 	 loss mean: 70.53956604003906
nll mean: 60.466064453125 	 kl mean: 10.55302619934082 	 loss mean: 71.01908874511719
nll mean: 59.962432861328125 	 kl mean: 10.55302619934082 	 loss mean: 70.51545715332031


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:18<00:05,  1.61it/s]
 50%|█████     | 5/10 [00:00<00:00, 10.03it/s][A
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 70%|███████   | 7/10 [00:00<00:00, 10.11it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.07it/s][A

nll mean: 61.20248794555664 	 kl mean: 10.55302619934082 	 loss mean: 71.7555160522461
nll mean: 60.034061431884766 	 kl mean: 10.55302619934082 	 loss mean: 70.58708953857422
nll mean: 60.56043243408203 	 kl mean: 10.55302619934082 	 loss mean: 71.11345672607422


                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
                                               [A
 76%|███████▋  | 29/38 [00:19<00:05,  1.61it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.07it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.07it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 60.17157745361328 	 kl mean: 10.55302619934082 	 loss mean: 70.724609375
nll mean: 60.2880973815918 	 kl mean: 10.55302619934082 	 loss mean: 70.84112548828125
nll mean: 103.39374542236328 	 kl mean: 10.07440185546875 	 loss mean: 113.4681396484375


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 12.90it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.75it/s][A

nll mean: 103.23400115966797 	 kl mean: 10.07440185546875 	 loss mean: 113.30841064453125
nll mean: 103.83621215820312 	 kl mean: 10.07440185546875 	 loss mean: 113.9106216430664
nll mean: 103.24607849121094 	 kl mean: 10.07440185546875 	 loss mean: 113.32048034667969


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 40%|████      | 4/10 [00:00<00:00, 12.75it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.80it/s][A

nll mean: 103.48847961425781 	 kl mean: 10.07440185546875 	 loss mean: 113.56288146972656
nll mean: 103.75178527832031 	 kl mean: 10.07440185546875 	 loss mean: 113.82618713378906
nll mean: 103.80038452148438 	 kl mean: 10.07440185546875 	 loss mean: 113.87478637695312


                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.80it/s][A
                                               [A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               [A
 79%|███████▉  | 30/38 [00:20<00:05,  1.36it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.84it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.73it/s][A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 103.03155517578125 	 kl mean: 10.07440185546875 	 loss mean: 113.10596466064453
nll mean: 104.07963562011719 	 kl mean: 10.07440185546875 	 loss mean: 114.15403747558594
nll mean: 103.47146606445312 	 kl mean: 10.07440185546875 	 loss mean: 113.54586791992188


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A

nll mean: 136.7332305908203 	 kl mean: 10.455705642700195 	 loss mean: 147.18893432617188
nll mean: 136.60739135742188 	 kl mean: 10.455705642700195 	 loss mean: 147.06309509277344



 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 20%|██        | 2/10 [00:00<00:00, 10.09it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 10.02it/s][A
                                               [A

nll mean: 136.35629272460938 	 kl mean: 10.455705642700195 	 loss mean: 146.81199645996094
nll mean: 136.03451538085938 	 kl mean: 10.455705642700195 	 loss mean: 146.49021911621094



 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 40%|████      | 4/10 [00:00<00:00, 10.00it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 50%|█████     | 5/10 [00:00<00:00,  9.97it/s][A
                                               [A


nll mean: 136.76730346679688 	 kl mean: 10.455705642700195 	 loss mean: 147.2230224609375
nll mean: 136.6078338623047 	 kl mean: 10.455705642700195 	 loss mean: 147.06353759765625


 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]
 60%|██████    | 6/10 [00:00<00:00,  9.94it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:20<00:05,  1.33it/s]


nll mean: 136.57586669921875 	 kl mean: 10.455705642700195 	 loss mean: 147.03155517578125
nll mean: 136.45562744140625 	 kl mean: 10.455705642700195 	 loss mean: 146.91134643554688
nll mean: 136.23403930664062 	 kl mean: 10.455705642700195 	 loss mean: 146.6897430419922


 80%|████████  | 8/10 [00:00<00:00,  9.98it/s][A
                                               [A
 82%|████████▏ | 31/38 [00:21<00:05,  1.33it/s]
 90%|█████████ | 9/10 [00:01<00:00,  9.95it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.95it/s][A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 25.95it/s][A

nll mean: 136.33177185058594 	 kl mean: 10.455705642700195 	 loss mean: 146.78749084472656
nll mean: 62.79624557495117 	 kl mean: 9.313054084777832 	 loss mean: 72.10929870605469
nll mean: 62.69451141357422 	 kl mean: 9.313054084777832 	 loss mean: 72.007568359375
nll mean: 62.83989715576172 	 kl mean: 9.313054084777832 	 loss mean: 72.15294647216797
nll mean: 62.797996520996094 	 kl mean: 9.313054084777832 	 loss mean: 72.11105346679688
nll mean: 62.647911071777344 	 kl mean: 9.313054084777832 	 loss mean: 71.96096801757812


                                               
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 30%|███       | 3/10 [00:00<00:00, 25.95it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
 60%|██████    | 6/10 [00:00<00:00, 25.72it/s][A
                                               [A
 84%|████████▍ | 32/38 [00:21<00:04,  1.21it/s]
100%|██████████| 10/10 [00:00<00:00, 25.43it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 62.45182418823242 	 kl mean: 9.313054084777832 	 loss mean: 71.76487731933594
nll mean: 62.35614013671875 	 kl mean: 9.313054084777832 	 loss mean: 71.66919708251953
nll mean: 62.432804107666016 	 kl mean: 9.313054084777832 	 loss mean: 71.74585723876953
nll mean: 62.484466552734375 	 kl mean: 9.313054084777832 	 loss mean: 71.79751586914062
nll mean: 62.934959411621094 	 kl mean: 9.313054084777832 	 loss mean: 72.24801635742188


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.39it/s][A

nll mean: 118.65338134765625 	 kl mean: 9.013278007507324 	 loss mean: 127.66665649414062
nll mean: 118.40606689453125 	 kl mean: 9.013278007507324 	 loss mean: 127.41934204101562
nll mean: 118.82846069335938 	 kl mean: 9.013278007507324 	 loss mean: 127.84174346923828
nll mean: 118.25796508789062 	 kl mean: 9.013278007507324 	 loss mean: 127.27125549316406
nll mean: 118.83015441894531 	 kl mean: 9.013278007507324 	 loss mean: 127.84343719482422


                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 30%|███       | 3/10 [00:00<00:00, 21.39it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.35it/s][A
                                               [A
 87%|████████▋ | 33/38 [00:21<00:03,  1.43it/s]
100%|██████████| 10/10 [00:00<00:00, 21.14it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 118.47350311279297 	 kl mean: 9.013278007507324 	 loss mean: 127.48678588867188
nll mean: 118.84156799316406 	 kl mean: 9.013278007507324 	 loss mean: 127.85484313964844
nll mean: 118.6471176147461 	 kl mean: 9.013278007507324 	 loss mean: 127.66038513183594
nll mean: 118.69810485839844 	 kl mean: 9.013278007507324 	 loss mean: 127.71138763427734
nll mean: 118.8504409790039 	 kl mean: 9.013278007507324 	 loss mean: 127.86372375488281


                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A

nll mean: 118.47724914550781 	 kl mean: 10.465352058410645 	 loss mean: 128.94259643554688
nll mean: 118.58860778808594 	 kl mean: 10.465352058410645 	 loss mean: 129.053955078125
nll mean: 118.31427764892578 	 kl mean: 10.465352058410645 	 loss mean: 128.77963256835938


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.45it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 40%|████      | 4/10 [00:00<00:00, 12.47it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.39it/s][A

nll mean: 118.71987915039062 	 kl mean: 10.465352058410645 	 loss mean: 129.18524169921875
nll mean: 118.95252227783203 	 kl mean: 10.465352058410645 	 loss mean: 129.41787719726562
nll mean: 118.63873291015625 	 kl mean: 10.465352058410645 	 loss mean: 129.10409545898438


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 60%|██████    | 6/10 [00:00<00:00, 12.39it/s][A
                                               [A
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A

nll mean: 118.19992065429688 	 kl mean: 10.465352058410645 	 loss mean: 128.66526794433594
nll mean: 118.79049682617188 	 kl mean: 10.465352058410645 	 loss mean: 129.255859375
nll mean: 119.16796875 	 kl mean: 10.465352058410645 	 loss mean: 129.63330078125


                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.38it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
 20%|██        | 2/10 [00:00<00:00, 10.62it/s][A

nll mean: 118.57282257080078 	 kl mean: 10.465352058410645 	 loss mean: 129.03817749023438
nll mean: 113.70880126953125 	 kl mean: 9.34712028503418 	 loss mean: 123.05592346191406
nll mean: 113.10104370117188 	 kl mean: 9.34712028503418 	 loss mean: 122.44816589355469


                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.62it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A

nll mean: 113.86064910888672 	 kl mean: 9.34712028503418 	 loss mean: 123.207763671875
nll mean: 114.11898803710938 	 kl mean: 9.34712028503418 	 loss mean: 123.46611022949219
nll mean: 113.52344512939453 	 kl mean: 9.34712028503418 	 loss mean: 122.87055969238281


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 40%|████      | 4/10 [00:00<00:00, 10.59it/s][A
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 60%|██████    | 6/10 [00:00<00:00, 10.61it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.64it/s][A

nll mean: 113.48686981201172 	 kl mean: 9.34712028503418 	 loss mean: 122.83399200439453
nll mean: 113.39645385742188 	 kl mean: 9.34712028503418 	 loss mean: 122.74357604980469
nll mean: 113.50257873535156 	 kl mean: 9.34712028503418 	 loss mean: 122.84969329833984


                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
                                               [A
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s]
 80%|████████  | 8/10 [00:00<00:00, 10.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 114.01237487792969 	 kl mean: 9.34712028503418 	 loss mean: 123.3594970703125
nll mean: 114.02195739746094 	 kl mean: 9.34712028503418 	 loss mean: 123.36907958984375
nll mean: 111.03170013427734 	 kl mean: 9.609739303588867 	 loss mean: 120.64143371582031
nll mean: 110.7728271484375 	 kl mean: 9.609739303588867 	 loss mean: 120.382568359375


                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.70it/s][A
                                               [A
                                              

nll mean: 110.61406707763672 	 kl mean: 9.609739303588867 	 loss mean: 120.22380065917969
nll mean: 110.65785217285156 	 kl mean: 9.609739303588867 	 loss mean: 120.26759338378906
nll mean: 110.50173950195312 	 kl mean: 9.609739303588867 	 loss mean: 120.11146545410156
nll mean: 110.3663101196289 	 kl mean: 9.609739303588867 	 loss mean: 119.97604370117188


 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
 60%|██████    | 6/10 [00:00<00:00, 21.46it/s][A
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
                                               [A
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s]
100%|██████████| 10/10 [00:00<00:00, 20.76it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 110.90955352783203 	 kl mean: 9.609739303588867 	 loss mean: 120.51929473876953
nll mean: 110.89706420898438 	 kl mean: 9.609739303588867 	 loss mean: 120.50679779052734
nll mean: 110.88139343261719 	 kl mean: 9.609739303588867 	 loss mean: 120.49111938476562
nll mean: 110.61927795410156 	 kl mean: 9.609739303588867 	 loss mean: 120.22901916503906
nll mean: 84.3863296508789 	 kl mean: 10.991235733032227 	 loss mean: 95.3775634765625


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
 40%|████      | 4/10 [00:00<00:00, 30.68it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.55it/s][A

nll mean: 84.01912689208984 	 kl mean: 10.991235733032227 	 loss mean: 95.01036834716797
nll mean: 84.43775177001953 	 kl mean: 10.991235733032227 	 loss mean: 95.42900085449219
nll mean: 84.29346466064453 	 kl mean: 10.991235733032227 	 loss mean: 95.2846908569336
nll mean: 84.22625732421875 	 kl mean: 10.991235733032227 	 loss mean: 95.21749114990234
nll mean: 83.60585021972656 	 kl mean: 10.991235733032227 	 loss mean: 94.5970687866211
nll mean: 83.56087493896484 	 kl mean: 10.991235733032227 	 loss mean: 94.55210876464844
nll mean: 84.50604248046875 	 kl mean: 10.991235733032227 	 loss mean: 95.49727630615234


                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
                                               [A
 97%|█████████▋| 37/38 [00:24<00:00,  1.47it/s]
100%|██████████| 10/10 [00:00<00:00, 30.45it/s][A
100%|██████████| 38/38 [00:24<00:00,  1.55it/s]


nll mean: 84.3438720703125 	 kl mean: 10.991235733032227 	 loss mean: 95.3351058959961
nll mean: 84.56156158447266 	 kl mean: 10.991235733032227 	 loss mean: 95.55279541015625
Approximate NLL:
tensor(120.5020, device='cuda:0')
Approximate KL:
tensor(9.8161, device='cuda:0')
Testing took 0:00:25.451330


  0%|          | 0/38 [00:00<?, ?it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
                                      
  0%|          | 0/38 [00:00<?, ?it/s][A
 30%|███       | 3/10 [00:00<00:00, 26.01it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].01it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].01it/s][A
                                              

nll mean: 110.3531494140625 	 kl mean: 10.285588264465332 	 loss mean: 120.63874053955078
nll mean: 109.29132080078125 	 kl mean: 10.285588264465332 	 loss mean: 119.57691192626953
nll mean: 109.1849365234375 	 kl mean: 10.285588264465332 	 loss mean: 119.47052001953125
nll mean: 109.50045776367188 	 kl mean: 10.285588264465332 	 loss mean: 119.78604888916016
nll mean: 110.00563049316406 	 kl mean: 10.285588264465332 	 loss mean: 120.29121398925781



  0%|          | 0/38 [00:00<?, ?it/s].01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.66it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].66it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].66it/s][A
                                              
  0%|          | 0/38 [00:00<?, ?it/s].66it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.41it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 25.11it/s][A
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 109.28099060058594 	 kl mean: 10.285588264465332 	 loss mean: 119.56657409667969
nll mean: 108.70108795166016 	 kl mean: 10.285588264465332 	 loss mean: 118.98667907714844
nll mean: 109.27044677734375 	 kl mean: 10.285588264465332 	 loss mean: 119.55603790283203
nll mean: 108.96043395996094 	 kl mean: 10.285588264465332 	 loss mean: 119.24602508544922
nll mean: 109.8648452758789 	 kl mean: 10.285588264465332 	 loss mean: 120.15043640136719



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s]
 20%|██        | 2/10 [00:00<00:00, 13.62it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A

nll mean: 125.09107208251953 	 kl mean: 9.757591247558594 	 loss mean: 134.84866333007812
nll mean: 126.22123718261719 	 kl mean: 9.757591247558594 	 loss mean: 135.97882080078125
nll mean: 125.18434143066406 	 kl mean: 9.757591247558594 	 loss mean: 134.94192504882812



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A
 40%|████      | 4/10 [00:00<00:00, 13.68it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 13.76it/s][A

nll mean: 125.32391357421875 	 kl mean: 9.757591247558594 	 loss mean: 135.08151245117188
nll mean: 125.18098449707031 	 kl mean: 9.757591247558594 	 loss mean: 134.93856811523438
nll mean: 125.00131225585938 	 kl mean: 9.757591247558594 	 loss mean: 134.7589111328125



                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A
                                              
  3%|▎         | 1/38 [00:00<00:14,  2.50it/s][A
 80%|████████  | 8/10 [00:00<00:00, 13.71it/s][A
                                              
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s][A

nll mean: 125.33026885986328 	 kl mean: 9.757591247558594 	 loss mean: 135.08786010742188
nll mean: 125.76815795898438 	 kl mean: 9.757591247558594 	 loss mean: 135.5257568359375
nll mean: 125.6883544921875 	 kl mean: 9.757591247558594 	 loss mean: 135.4459228515625



                                              
  3%|▎         | 1/38 [00:01<00:14,  2.50it/s][A
100%|██████████| 10/10 [00:00<00:00, 13.79it/s][A
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s]
 30%|███       | 3/10 [00:00<00:00, 24.77it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A

nll mean: 125.24897003173828 	 kl mean: 9.757591247558594 	 loss mean: 135.00656127929688
nll mean: 98.83914184570312 	 kl mean: 8.78410530090332 	 loss mean: 107.62326049804688
nll mean: 98.42103576660156 	 kl mean: 8.78410530090332 	 loss mean: 107.20513153076172
nll mean: 98.48040008544922 	 kl mean: 8.78410530090332 	 loss mean: 107.2645034790039
nll mean: 98.99650573730469 	 kl mean: 8.78410530090332 	 loss mean: 107.78060913085938



                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.56it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
                                              
  5%|▌         | 2/38 [00:01<00:17,  2.01it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.44it/s][A

nll mean: 99.14523315429688 	 kl mean: 8.78410530090332 	 loss mean: 107.92933654785156
nll mean: 98.22499084472656 	 kl mean: 8.78410530090332 	 loss mean: 107.00910949707031
nll mean: 98.81781005859375 	 kl mean: 8.78410530090332 	 loss mean: 107.60191345214844
nll mean: 98.60610961914062 	 kl mean: 8.78410530090332 	 loss mean: 107.39021301269531
nll mean: 98.76690673828125 	 kl mean: 8.78410530090332 	 loss mean: 107.55101776123047



                                              
100%|██████████| 10/10 [00:00<00:00, 24.40it/s][A
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s]
 20%|██        | 2/10 [00:00<00:00, 10.74it/s][A

nll mean: 98.68402099609375 	 kl mean: 8.78410530090332 	 loss mean: 107.46812438964844
nll mean: 138.68646240234375 	 kl mean: 9.09825611114502 	 loss mean: 147.78469848632812
nll mean: 138.80320739746094 	 kl mean: 9.09825611114502 	 loss mean: 147.90145874023438



                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:01<00:16,  2.12it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.77it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A

nll mean: 138.36273193359375 	 kl mean: 9.09825611114502 	 loss mean: 147.46099853515625
nll mean: 138.78128051757812 	 kl mean: 9.09825611114502 	 loss mean: 147.87954711914062
nll mean: 138.40985107421875 	 kl mean: 9.09825611114502 	 loss mean: 147.50811767578125



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.80it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.79it/s][A

nll mean: 138.57131958007812 	 kl mean: 9.09825611114502 	 loss mean: 147.66958618164062
nll mean: 138.0191650390625 	 kl mean: 9.09825611114502 	 loss mean: 147.11741638183594
nll mean: 137.97560119628906 	 kl mean: 9.09825611114502 	 loss mean: 147.0738525390625



                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
                                              
  8%|▊         | 3/38 [00:02<00:16,  2.12it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.79it/s][A
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]

nll mean: 138.36126708984375 	 kl mean: 9.09825611114502 	 loss mean: 147.45953369140625
nll mean: 138.295166015625 	 kl mean: 9.09825611114502 	 loss mean: 147.3934326171875
nll mean: 126.01953125 	 kl mean: 8.676916122436523 	 loss mean: 134.69644165039062



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s]
 20%|██        | 2/10 [00:00<00:00, 14.34it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.16it/s][A

nll mean: 126.52523803710938 	 kl mean: 8.676916122436523 	 loss mean: 135.2021484375
nll mean: 126.19342041015625 	 kl mean: 8.676916122436523 	 loss mean: 134.87033081054688
nll mean: 126.0106201171875 	 kl mean: 8.676916122436523 	 loss mean: 134.68753051757812



                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.06it/s][A
                                              
 11%|█         | 4/38 [00:02<00:20,  1.64it/s][A

nll mean: 126.62249755859375 	 kl mean: 8.676916122436523 	 loss mean: 135.29940795898438
nll mean: 126.65423583984375 	 kl mean: 8.676916122436523 	 loss mean: 135.33116149902344
nll mean: 126.018310546875 	 kl mean: 8.676916122436523 	 loss mean: 134.69522094726562



                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.05it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
                                              
 11%|█         | 4/38 [00:03<00:20,  1.64it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.07it/s][A
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 126.49024963378906 	 kl mean: 8.676916122436523 	 loss mean: 135.1671600341797
nll mean: 126.42400360107422 	 kl mean: 8.676916122436523 	 loss mean: 135.10092163085938
nll mean: 126.66222381591797 	 kl mean: 8.676916122436523 	 loss mean: 135.33914184570312



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s]
 20%|██        | 2/10 [00:00<00:00, 14.40it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.71062469482422 	 kl mean: 8.882162094116211 	 loss mean: 132.59278869628906
nll mean: 123.29006958007812 	 kl mean: 8.882162094116211 	 loss mean: 132.1722412109375
nll mean: 123.86357116699219 	 kl mean: 8.882162094116211 	 loss mean: 132.74574279785156



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.34it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.45it/s][A

nll mean: 123.11767578125 	 kl mean: 8.882162094116211 	 loss mean: 131.99984741210938
nll mean: 123.53215789794922 	 kl mean: 8.882162094116211 	 loss mean: 132.41433715820312
nll mean: 123.38919067382812 	 kl mean: 8.882162094116211 	 loss mean: 132.2713623046875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.24it/s][A
                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A

nll mean: 123.79563903808594 	 kl mean: 8.882162094116211 	 loss mean: 132.67779541015625
nll mean: 123.58677673339844 	 kl mean: 8.882162094116211 	 loss mean: 132.46893310546875
nll mean: 123.76896667480469 	 kl mean: 8.882162094116211 	 loss mean: 132.651123046875



                                              
 13%|█▎        | 5/38 [00:03<00:21,  1.56it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.21it/s][A
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:03<00:21,  1.51it/s]
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s]
 30%|███       | 3/10 [00:00<00:00, 25.37it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A

nll mean: 123.61837768554688 	 kl mean: 8.882162094116211 	 loss mean: 132.50054931640625
nll mean: 133.54721069335938 	 kl mean: 8.485042572021484 	 loss mean: 142.03224182128906
nll mean: 134.245361328125 	 kl mean: 8.485042572021484 	 loss mean: 142.7303924560547
nll mean: 134.3497314453125 	 kl mean: 8.485042572021484 	 loss mean: 142.83477783203125
nll mean: 133.82272338867188 	 kl mean: 8.485042572021484 	 loss mean: 142.3077392578125



                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.13it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
                                              
 16%|█▌        | 6/38 [00:04<00:21,  1.51it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.95it/s][A

nll mean: 134.1706085205078 	 kl mean: 8.485042572021484 	 loss mean: 142.6556396484375
nll mean: 134.69430541992188 	 kl mean: 8.485042572021484 	 loss mean: 143.1793670654297
nll mean: 134.2745361328125 	 kl mean: 8.485042572021484 	 loss mean: 142.75958251953125
nll mean: 134.1405029296875 	 kl mean: 8.485042572021484 	 loss mean: 142.62554931640625
nll mean: 134.0070343017578 	 kl mean: 8.485042572021484 	 loss mean: 142.49208068847656



                                              
100%|██████████| 10/10 [00:00<00:00, 24.75it/s][A
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s]
 30%|███       | 3/10 [00:00<00:00, 24.59it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A

nll mean: 133.75674438476562 	 kl mean: 8.485042572021484 	 loss mean: 142.2417755126953
nll mean: 105.75352478027344 	 kl mean: 8.962804794311523 	 loss mean: 114.7163314819336
nll mean: 106.29307556152344 	 kl mean: 8.962804794311523 	 loss mean: 115.2558822631836
nll mean: 105.69693756103516 	 kl mean: 8.962804794311523 	 loss mean: 114.65974426269531
nll mean: 106.32362365722656 	 kl mean: 8.962804794311523 	 loss mean: 115.28643035888672



                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.56it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
                                              
 18%|█▊        | 7/38 [00:04<00:18,  1.71it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.52it/s][A

nll mean: 106.02571868896484 	 kl mean: 8.962804794311523 	 loss mean: 114.988525390625
nll mean: 105.695068359375 	 kl mean: 8.962804794311523 	 loss mean: 114.65786743164062
nll mean: 105.73077392578125 	 kl mean: 8.962804794311523 	 loss mean: 114.6935806274414
nll mean: 105.76858520507812 	 kl mean: 8.962804794311523 	 loss mean: 114.73139190673828
nll mean: 105.66571044921875 	 kl mean: 8.962804794311523 	 loss mean: 114.6285171508789



                                              
100%|██████████| 10/10 [00:00<00:00, 24.47it/s][A
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s]
 20%|██        | 2/10 [00:00<00:00, 14.61it/s][A

nll mean: 106.46373748779297 	 kl mean: 8.962804794311523 	 loss mean: 115.42654418945312
nll mean: 131.97079467773438 	 kl mean: 9.483479499816895 	 loss mean: 141.45428466796875
nll mean: 132.6988983154297 	 kl mean: 9.483479499816895 	 loss mean: 142.18238830566406



                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:04<00:15,  1.88it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.71it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A

nll mean: 132.06080627441406 	 kl mean: 9.483479499816895 	 loss mean: 141.54428100585938
nll mean: 132.68453979492188 	 kl mean: 9.483479499816895 	 loss mean: 142.16802978515625
nll mean: 132.34088134765625 	 kl mean: 9.483479499816895 	 loss mean: 141.82437133789062



                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.79it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.84it/s][A


nll mean: 131.36326599121094 	 kl mean: 9.483479499816895 	 loss mean: 140.84674072265625
nll mean: 132.15994262695312 	 kl mean: 9.483479499816895 	 loss mean: 141.64341735839844
nll mean: 132.26956176757812 	 kl mean: 9.483479499816895 	 loss mean: 141.7530517578125


                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
                                              
 21%|██        | 8/38 [00:05<00:15,  1.88it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.57it/s][A
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]

nll mean: 132.60140991210938 	 kl mean: 9.483479499816895 	 loss mean: 142.0848846435547
nll mean: 131.9208984375 	 kl mean: 9.483479499816895 	 loss mean: 141.40438842773438
nll mean: 130.85470581054688 	 kl mean: 9.610123634338379 	 loss mean: 140.46482849121094
nll mean: 130.71295166015625 	 kl mean: 9.610123634338379 	 loss mean: 140.3230743408203



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.80it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.55it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A

nll mean: 131.40359497070312 	 kl mean: 9.610123634338379 	 loss mean: 141.01370239257812
nll mean: 131.53585815429688 	 kl mean: 9.610123634338379 	 loss mean: 141.14599609375
nll mean: 131.0269775390625 	 kl mean: 9.610123634338379 	 loss mean: 140.63710021972656
nll mean: 130.814453125 	 kl mean: 9.610123634338379 	 loss mean: 140.42457580566406
nll mean: 131.0404815673828 	 kl mean: 9.610123634338379 	 loss mean: 140.65060424804688



                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
                                              
 24%|██▎       | 9/38 [00:05<00:16,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.35it/s][A
                                              
100%|██████████| 10/10 [00:00<00:00, 21.13it/s][A
 26%|██▋       | 10/38 [00:05<00:15,  1.82it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.82it/s]
                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.82it/s]

nll mean: 130.97862243652344 	 kl mean: 9.610123634338379 	 loss mean: 140.5887451171875
nll mean: 130.61483764648438 	 kl mean: 9.610123634338379 	 loss mean: 140.22494506835938
nll mean: 130.67520141601562 	 kl mean: 9.610123634338379 	 loss mean: 140.2853240966797
nll mean: 119.08261108398438 	 kl mean: 9.709797859191895 	 loss mean: 128.79241943359375
nll mean: 118.51821899414062 	 kl mean: 9.709797859191895 	 loss mean: 128.22802734375



                                               
 26%|██▋       | 10/38 [00:05<00:15,  1.82it/s]
 30%|███       | 3/10 [00:00<00:00, 25.10it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.71it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A

nll mean: 119.52874755859375 	 kl mean: 9.709797859191895 	 loss mean: 129.23855590820312
nll mean: 119.30036926269531 	 kl mean: 9.709797859191895 	 loss mean: 129.01016235351562
nll mean: 119.63818359375 	 kl mean: 9.709797859191895 	 loss mean: 129.3479766845703
nll mean: 119.32870483398438 	 kl mean: 9.709797859191895 	 loss mean: 129.03851318359375
nll mean: 119.12788391113281 	 kl mean: 9.709797859191895 	 loss mean: 128.83767700195312



                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A
                                               
 26%|██▋       | 10/38 [00:06<00:15,  1.82it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.41it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.13it/s][A
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]

nll mean: 119.25848388671875 	 kl mean: 9.709797859191895 	 loss mean: 128.96827697753906
nll mean: 119.23640441894531 	 kl mean: 9.709797859191895 	 loss mean: 128.94619750976562
nll mean: 118.94528198242188 	 kl mean: 9.709797859191895 	 loss mean: 128.6550750732422
nll mean: 141.26870727539062 	 kl mean: 9.448381423950195 	 loss mean: 150.7170867919922
nll mean: 141.04458618164062 	 kl mean: 9.448381423950195 	 loss mean: 150.49295043945312



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s]
 30%|███       | 3/10 [00:00<00:00, 21.56it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.26it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A

nll mean: 141.75839233398438 	 kl mean: 9.448381423950195 	 loss mean: 151.20675659179688
nll mean: 141.37457275390625 	 kl mean: 9.448381423950195 	 loss mean: 150.82293701171875
nll mean: 141.50515747070312 	 kl mean: 9.448381423950195 	 loss mean: 150.9535369873047
nll mean: 141.49900817871094 	 kl mean: 9.448381423950195 	 loss mean: 150.9473876953125
nll mean: 141.05323791503906 	 kl mean: 9.448381423950195 	 loss mean: 150.50161743164062



                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A
                                               
 29%|██▉       | 11/38 [00:06<00:13,  1.97it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.04it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 20.89it/s][A
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]

nll mean: 141.53143310546875 	 kl mean: 9.448381423950195 	 loss mean: 150.97982788085938
nll mean: 141.15115356445312 	 kl mean: 9.448381423950195 	 loss mean: 150.5995330810547
nll mean: 140.8505859375 	 kl mean: 9.448381423950195 	 loss mean: 150.29898071289062
nll mean: 121.4420166015625 	 kl mean: 9.776752471923828 	 loss mean: 131.21876525878906



                                               
 32%|███▏      | 12/38 [00:06<00:13,  2.00it/s]
 20%|██        | 2/10 [00:00<00:00, 12.16it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.23it/s][A

nll mean: 121.20370483398438 	 kl mean: 9.776752471923828 	 loss mean: 130.98046875
nll mean: 121.05519104003906 	 kl mean: 9.776752471923828 	 loss mean: 130.8319549560547
nll mean: 120.96544647216797 	 kl mean: 9.776752471923828 	 loss mean: 130.7421875



                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.28it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A

nll mean: 121.08490753173828 	 kl mean: 9.776752471923828 	 loss mean: 130.86166381835938
nll mean: 121.09048461914062 	 kl mean: 9.776752471923828 	 loss mean: 130.8672332763672
nll mean: 121.2984390258789 	 kl mean: 9.776752471923828 	 loss mean: 131.0751953125



                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.33it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
                                               
 32%|███▏      | 12/38 [00:07<00:13,  2.00it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.34it/s][A
 34%|███▍      | 13/38 [00:07<00:14,  1.68it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.20111083984375 	 kl mean: 9.776752471923828 	 loss mean: 130.97787475585938
nll mean: 120.66639709472656 	 kl mean: 9.776752471923828 	 loss mean: 130.44314575195312
nll mean: 121.55879974365234 	 kl mean: 9.776752471923828 	 loss mean: 131.33554077148438



                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.68it/s]
 10%|█         | 1/10 [00:00<00:00,  9.97it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.68it/s][A
 20%|██        | 2/10 [00:00<00:00,  9.89it/s][A
                                               

nll mean: 161.68399047851562 	 kl mean: 9.935394287109375 	 loss mean: 171.619384765625
nll mean: 162.0030517578125 	 kl mean: 9.935394287109375 	 loss mean: 171.93844604492188



 34%|███▍      | 13/38 [00:07<00:14,  1.68it/s][A
                                               
 34%|███▍      | 13/38 [00:07<00:14,  1.68it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.95it/s][A

nll mean: 161.3424835205078 	 kl mean: 9.935394287109375 	 loss mean: 171.2778778076172
nll mean: 162.34434509277344 	 kl mean: 9.935394287109375 	 loss mean: 172.2797393798828



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.68it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.90it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.68it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.87it/s][A


nll mean: 162.04714965820312 	 kl mean: 9.935394287109375 	 loss mean: 171.98252868652344
nll mean: 162.12718200683594 	 kl mean: 9.935394287109375 	 loss mean: 172.06256103515625


                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.68it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.88it/s][A
                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.68it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.84it/s][A

nll mean: 161.9425048828125 	 kl mean: 9.935394287109375 	 loss mean: 171.87791442871094
nll mean: 161.60354614257812 	 kl mean: 9.935394287109375 	 loss mean: 171.53895568847656



                                               
 34%|███▍      | 13/38 [00:08<00:14,  1.68it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.86it/s][A
                                               
100%|██████████| 10/10 [00:01<00:00,  9.90it/s][A
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]

nll mean: 161.7295379638672 	 kl mean: 9.935394287109375 	 loss mean: 171.66493225097656
nll mean: 161.9375 	 kl mean: 9.935394287109375 	 loss mean: 171.87289428710938
nll mean: 135.2634735107422 	 kl mean: 8.5446195602417 	 loss mean: 143.80810546875



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s]
 20%|██        | 2/10 [00:00<00:00, 18.31it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s][A
 40%|████      | 4/10 [00:00<00:00, 18.13it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s][A

nll mean: 135.36959838867188 	 kl mean: 8.5446195602417 	 loss mean: 143.91421508789062
nll mean: 135.49217224121094 	 kl mean: 8.5446195602417 	 loss mean: 144.03680419921875
nll mean: 134.37728881835938 	 kl mean: 8.5446195602417 	 loss mean: 142.92190551757812
nll mean: 135.23660278320312 	 kl mean: 8.5446195602417 	 loss mean: 143.78121948242188



                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s][A
 60%|██████    | 6/10 [00:00<00:00, 18.05it/s][A
                                               
 37%|███▋      | 14/38 [00:08<00:17,  1.39it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s][A
 80%|████████  | 8/10 [00:00<00:00, 17.99it/s][A
                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s][A

nll mean: 135.11280822753906 	 kl mean: 8.5446195602417 	 loss mean: 143.6574249267578
nll mean: 134.73330688476562 	 kl mean: 8.5446195602417 	 loss mean: 143.27793884277344
nll mean: 135.09487915039062 	 kl mean: 8.5446195602417 	 loss mean: 143.63949584960938
nll mean: 134.74673461914062 	 kl mean: 8.5446195602417 	 loss mean: 143.29135131835938



                                               
 37%|███▋      | 14/38 [00:09<00:17,  1.39it/s][A
100%|██████████| 10/10 [00:00<00:00, 17.93it/s][A
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s]
 20%|██        | 2/10 [00:00<00:00, 10.70it/s][A

nll mean: 134.9000244140625 	 kl mean: 8.5446195602417 	 loss mean: 143.44464111328125
nll mean: 143.4764404296875 	 kl mean: 9.44464111328125 	 loss mean: 152.92108154296875
nll mean: 143.48594665527344 	 kl mean: 9.44464111328125 	 loss mean: 152.9305877685547



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.72it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A

nll mean: 143.6048126220703 	 kl mean: 9.44464111328125 	 loss mean: 153.0494384765625
nll mean: 143.60821533203125 	 kl mean: 9.44464111328125 	 loss mean: 153.0528564453125
nll mean: 143.0814666748047 	 kl mean: 9.44464111328125 	 loss mean: 152.52609252929688



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.74it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.73it/s][A

nll mean: 143.36354064941406 	 kl mean: 9.44464111328125 	 loss mean: 152.8081817626953
nll mean: 143.65338134765625 	 kl mean: 9.44464111328125 	 loss mean: 153.0980224609375
nll mean: 144.00491333007812 	 kl mean: 9.44464111328125 	 loss mean: 153.4495391845703



                                               
 39%|███▉      | 15/38 [00:09<00:15,  1.49it/s][A
                                               
 39%|███▉      | 15/38 [00:10<00:15,  1.49it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.69it/s][A
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]

nll mean: 143.28533935546875 	 kl mean: 9.44464111328125 	 loss mean: 152.72998046875
nll mean: 142.77757263183594 	 kl mean: 9.44464111328125 	 loss mean: 152.22222900390625
nll mean: 143.9624786376953 	 kl mean: 8.209798812866211 	 loss mean: 152.17227172851562
nll mean: 144.56646728515625 	 kl mean: 8.209798812866211 	 loss mean: 152.77627563476562



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s]
 30%|███       | 3/10 [00:00<00:00, 24.66it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.50it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A

nll mean: 143.80441284179688 	 kl mean: 8.209798812866211 	 loss mean: 152.0142059326172
nll mean: 144.18943786621094 	 kl mean: 8.209798812866211 	 loss mean: 152.39923095703125
nll mean: 144.2366180419922 	 kl mean: 8.209798812866211 	 loss mean: 152.44642639160156
nll mean: 144.00460815429688 	 kl mean: 8.209798812866211 	 loss mean: 152.2144012451172
nll mean: 144.4674072265625 	 kl mean: 8.209798812866211 	 loss mean: 152.67718505859375



                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
                                               
 42%|████▏     | 16/38 [00:10<00:16,  1.33it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.48it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.38it/s][A
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]

nll mean: 144.1505889892578 	 kl mean: 8.209798812866211 	 loss mean: 152.36038208007812
nll mean: 144.45339965820312 	 kl mean: 8.209798812866211 	 loss mean: 152.66319274902344
nll mean: 144.82154846191406 	 kl mean: 8.209798812866211 	 loss mean: 153.03134155273438
nll mean: 134.42974853515625 	 kl mean: 8.794519424438477 	 loss mean: 143.22427368164062
nll mean: 134.1595001220703 	 kl mean: 8.794519424438477 	 loss mean: 142.95401000976562



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s]
 30%|███       | 3/10 [00:00<00:00, 24.81it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 60%|██████    | 6/10 [00:00<00:00, 24.76it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A

nll mean: 134.6241455078125 	 kl mean: 8.794519424438477 	 loss mean: 143.4186553955078
nll mean: 134.23660278320312 	 kl mean: 8.794519424438477 	 loss mean: 143.0311279296875
nll mean: 133.3961944580078 	 kl mean: 8.794519424438477 	 loss mean: 142.19070434570312
nll mean: 133.6085205078125 	 kl mean: 8.794519424438477 	 loss mean: 142.40304565429688
nll mean: 133.6506805419922 	 kl mean: 8.794519424438477 	 loss mean: 142.4451904296875



                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
                                               
 45%|████▍     | 17/38 [00:10<00:13,  1.54it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 24.68it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 24.60it/s][A
 47%|████▋     | 18/38 [00:10<00:11,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]

nll mean: 133.68038940429688 	 kl mean: 8.794519424438477 	 loss mean: 142.47491455078125
nll mean: 133.753173828125 	 kl mean: 8.794519424438477 	 loss mean: 142.54766845703125
nll mean: 134.07815551757812 	 kl mean: 8.794519424438477 	 loss mean: 142.8726806640625
nll mean: 129.4644012451172 	 kl mean: 9.864349365234375 	 loss mean: 139.3287353515625



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s]
 20%|██        | 2/10 [00:00<00:00, 12.12it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.19it/s][A

nll mean: 129.9117889404297 	 kl mean: 9.864349365234375 	 loss mean: 139.776123046875
nll mean: 130.07687377929688 	 kl mean: 9.864349365234375 	 loss mean: 139.94122314453125
nll mean: 129.911376953125 	 kl mean: 9.864349365234375 	 loss mean: 139.77574157714844



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.34it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A

nll mean: 130.04208374023438 	 kl mean: 9.864349365234375 	 loss mean: 139.90643310546875
nll mean: 129.78826904296875 	 kl mean: 9.864349365234375 	 loss mean: 139.65261840820312
nll mean: 129.27554321289062 	 kl mean: 9.864349365234375 	 loss mean: 139.139892578125



                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.44it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
                                               
 47%|████▋     | 18/38 [00:11<00:11,  1.73it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.52it/s][A
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 130.4482421875 	 kl mean: 9.864349365234375 	 loss mean: 140.3125762939453
nll mean: 129.41818237304688 	 kl mean: 9.864349365234375 	 loss mean: 139.28253173828125
nll mean: 130.757080078125 	 kl mean: 9.864349365234375 	 loss mean: 140.62142944335938



                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s]
 20%|██        | 2/10 [00:00<00:00, 12.51it/s][A
                                               
 50%|█████     | 19/38 [00:11<00:12,  1.55it/s][A

nll mean: 148.79685974121094 	 kl mean: 9.355218887329102 	 loss mean: 158.15206909179688
nll mean: 149.25640869140625 	 kl mean: 9.355218887329102 	 loss mean: 158.61163330078125
nll mean: 149.02244567871094 	 kl mean: 9.355218887329102 	 loss mean: 158.37765502929688



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.49it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.54it/s][A

nll mean: 149.58233642578125 	 kl mean: 9.355218887329102 	 loss mean: 158.93756103515625
nll mean: 148.96173095703125 	 kl mean: 9.355218887329102 	 loss mean: 158.31692504882812
nll mean: 149.467529296875 	 kl mean: 9.355218887329102 	 loss mean: 158.82275390625



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.48it/s][A
                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A

nll mean: 149.1055908203125 	 kl mean: 9.355218887329102 	 loss mean: 158.4608154296875
nll mean: 148.79446411132812 	 kl mean: 9.355218887329102 	 loss mean: 158.14968872070312
nll mean: 148.3589324951172 	 kl mean: 9.355218887329102 	 loss mean: 157.71414184570312



                                               
 50%|█████     | 19/38 [00:12<00:12,  1.55it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.43it/s][A
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s]
 20%|██        | 2/10 [00:00<00:00, 12.77it/s][A

nll mean: 148.30746459960938 	 kl mean: 9.355218887329102 	 loss mean: 157.6626739501953
nll mean: 156.35580444335938 	 kl mean: 9.009828567504883 	 loss mean: 165.36563110351562
nll mean: 156.09011840820312 	 kl mean: 9.009828567504883 	 loss mean: 165.09991455078125



                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.56it/s][A
                                               
 53%|█████▎    | 20/38 [00:12<00:12,  1.44it/s][A

nll mean: 156.50338745117188 	 kl mean: 9.009828567504883 	 loss mean: 165.51321411132812
nll mean: 156.64382934570312 	 kl mean: 9.009828567504883 	 loss mean: 165.65367126464844
nll mean: 156.69349670410156 	 kl mean: 9.009828567504883 	 loss mean: 165.7033233642578



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.51it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.44it/s][A

nll mean: 156.22161865234375 	 kl mean: 9.009828567504883 	 loss mean: 165.2314453125
nll mean: 156.64755249023438 	 kl mean: 9.009828567504883 	 loss mean: 165.65737915039062
nll mean: 156.59461975097656 	 kl mean: 9.009828567504883 	 loss mean: 165.60443115234375



                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
                                               
 53%|█████▎    | 20/38 [00:13<00:12,  1.44it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.39it/s][A
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]

nll mean: 156.3787841796875 	 kl mean: 9.009828567504883 	 loss mean: 165.38861083984375
nll mean: 156.66143798828125 	 kl mean: 9.009828567504883 	 loss mean: 165.6712646484375
nll mean: 117.2162094116211 	 kl mean: 9.440887451171875 	 loss mean: 126.6571044921875



                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s]
 20%|██        | 2/10 [00:00<00:00, 10.15it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 30%|███       | 3/10 [00:00<00:00, 10.10it/s][A
                                               

nll mean: 117.57335662841797 	 kl mean: 9.440887451171875 	 loss mean: 127.01425170898438
nll mean: 116.9333267211914 	 kl mean: 9.440887451171875 	 loss mean: 126.37422180175781



 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.06it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
                                               
 55%|█████▌    | 21/38 [00:13<00:12,  1.37it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.11it/s][A

nll mean: 116.57373046875 	 kl mean: 9.440887451171875 	 loss mean: 126.01461029052734
nll mean: 117.0252685546875 	 kl mean: 9.440887451171875 	 loss mean: 126.4661636352539
nll mean: 116.99711608886719 	 kl mean: 9.440887451171875 	 loss mean: 126.43800354003906



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.14it/s][A
                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A

nll mean: 117.19782257080078 	 kl mean: 9.440887451171875 	 loss mean: 126.63870239257812
nll mean: 116.97714233398438 	 kl mean: 9.440887451171875 	 loss mean: 126.41802215576172
nll mean: 117.0174560546875 	 kl mean: 9.440887451171875 	 loss mean: 126.45834350585938



                                               
 55%|█████▌    | 21/38 [00:14<00:12,  1.37it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.17it/s][A
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s]
 40%|████      | 4/10 [00:00<00:00, 33.14it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A

nll mean: 117.27780151367188 	 kl mean: 9.440887451171875 	 loss mean: 126.71868896484375
nll mean: 106.54464721679688 	 kl mean: 7.874528884887695 	 loss mean: 114.41917419433594
nll mean: 106.3970947265625 	 kl mean: 7.874528884887695 	 loss mean: 114.27162170410156
nll mean: 106.29959106445312 	 kl mean: 7.874528884887695 	 loss mean: 114.17413330078125
nll mean: 106.49479675292969 	 kl mean: 7.874528884887695 	 loss mean: 114.36933135986328
nll mean: 106.36224365234375 	 kl mean: 7.874528884887695 	 loss mean: 114.23677062988281
nll mean: 106.91398620605469 	 kl mean: 7.874528884887695 	 loss mean: 114.78851318359375



                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
 80%|████████  | 8/10 [00:00<00:00, 32.91it/s][A
                                               
 58%|█████▊    | 22/38 [00:14<00:12,  1.24it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 32.66it/s][A
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]

nll mean: 107.27583312988281 	 kl mean: 7.874528884887695 	 loss mean: 115.15037536621094
nll mean: 106.6986312866211 	 kl mean: 7.874528884887695 	 loss mean: 114.57315826416016
nll mean: 106.52350616455078 	 kl mean: 7.874528884887695 	 loss mean: 114.39803314208984
nll mean: 107.74446105957031 	 kl mean: 7.874528884887695 	 loss mean: 115.61898803710938
nll mean: 159.06582641601562 	 kl mean: 8.862276077270508 	 loss mean: 167.9281005859375



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s]
 20%|██        | 2/10 [00:00<00:00, 14.67it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.66it/s][A

nll mean: 158.89581298828125 	 kl mean: 8.862276077270508 	 loss mean: 167.75808715820312
nll mean: 158.59291076660156 	 kl mean: 8.862276077270508 	 loss mean: 167.4552001953125
nll mean: 159.3619384765625 	 kl mean: 8.862276077270508 	 loss mean: 168.22422790527344



                                               
 61%|██████    | 23/38 [00:14<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.69it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A

nll mean: 160.043212890625 	 kl mean: 8.862276077270508 	 loss mean: 168.90548706054688
nll mean: 158.90621948242188 	 kl mean: 8.862276077270508 	 loss mean: 167.7685089111328
nll mean: 159.12135314941406 	 kl mean: 8.862276077270508 	 loss mean: 167.98362731933594



                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.74it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
                                               
 61%|██████    | 23/38 [00:15<00:09,  1.52it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.67it/s][A
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]

nll mean: 159.27725219726562 	 kl mean: 8.862276077270508 	 loss mean: 168.1395263671875
nll mean: 159.2432861328125 	 kl mean: 8.862276077270508 	 loss mean: 168.10556030273438
nll mean: 159.20489501953125 	 kl mean: 8.862276077270508 	 loss mean: 168.0671844482422
nll mean: 121.36495208740234 	 kl mean: 10.118062973022461 	 loss mean: 131.48300170898438



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s]
 30%|███       | 3/10 [00:00<00:00, 21.54it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.52it/s][A

nll mean: 120.90086364746094 	 kl mean: 10.118062973022461 	 loss mean: 131.01893615722656
nll mean: 121.08497619628906 	 kl mean: 10.118062973022461 	 loss mean: 131.20303344726562
nll mean: 121.67903900146484 	 kl mean: 10.118062973022461 	 loss mean: 131.79710388183594
nll mean: 120.70002746582031 	 kl mean: 10.118062973022461 	 loss mean: 130.81808471679688
nll mean: 121.85821533203125 	 kl mean: 10.118062973022461 	 loss mean: 131.9762725830078



                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
                                               
 63%|██████▎   | 24/38 [00:15<00:09,  1.50it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.47it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.46it/s][A
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 121.05715942382812 	 kl mean: 10.118062973022461 	 loss mean: 131.1752166748047
nll mean: 121.47076416015625 	 kl mean: 10.118062973022461 	 loss mean: 131.58883666992188
nll mean: 120.54924011230469 	 kl mean: 10.118062973022461 	 loss mean: 130.66729736328125
nll mean: 120.97789001464844 	 kl mean: 10.118062973022461 	 loss mean: 131.095947265625



                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s]
 20%|██        | 2/10 [00:00<00:00, 14.54it/s][A
                                               
 66%|██████▌   | 25/38 [00:15<00:07,  1.65it/s][A

nll mean: 115.27486419677734 	 kl mean: 8.638923645019531 	 loss mean: 123.91378784179688
nll mean: 114.23648071289062 	 kl mean: 8.638923645019531 	 loss mean: 122.87540435791016
nll mean: 114.89789581298828 	 kl mean: 8.638923645019531 	 loss mean: 123.53681945800781



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 40%|████      | 4/10 [00:00<00:00, 14.60it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 60%|██████    | 6/10 [00:00<00:00, 14.67it/s][A

nll mean: 114.79255676269531 	 kl mean: 8.638923645019531 	 loss mean: 123.43148040771484
nll mean: 115.02096557617188 	 kl mean: 8.638923645019531 	 loss mean: 123.65989685058594
nll mean: 114.34850311279297 	 kl mean: 8.638923645019531 	 loss mean: 122.9874267578125



                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
 80%|████████  | 8/10 [00:00<00:00, 14.71it/s][A
                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A


nll mean: 115.01768493652344 	 kl mean: 8.638923645019531 	 loss mean: 123.6566162109375
nll mean: 114.76158905029297 	 kl mean: 8.638923645019531 	 loss mean: 123.4005126953125
nll mean: 115.27754211425781 	 kl mean: 8.638923645019531 	 loss mean: 123.91645812988281


                                               
 66%|██████▌   | 25/38 [00:16<00:07,  1.65it/s][A
100%|██████████| 10/10 [00:00<00:00, 14.71it/s][A
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s]
 30%|███       | 3/10 [00:00<00:00, 21.87it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A

nll mean: 114.86318969726562 	 kl mean: 8.638923645019531 	 loss mean: 123.50212097167969
nll mean: 81.56707763671875 	 kl mean: 8.344160079956055 	 loss mean: 89.91123962402344
nll mean: 82.06069946289062 	 kl mean: 8.344160079956055 	 loss mean: 90.40486145019531
nll mean: 81.86358642578125 	 kl mean: 8.344160079956055 	 loss mean: 90.20774841308594
nll mean: 81.16090393066406 	 kl mean: 8.344160079956055 	 loss mean: 89.50506591796875



                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 60%|██████    | 6/10 [00:00<00:00, 22.00it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
                                               
 68%|██████▊   | 26/38 [00:16<00:07,  1.59it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.86it/s][A

nll mean: 81.88483428955078 	 kl mean: 8.344160079956055 	 loss mean: 90.22900390625
nll mean: 81.84953308105469 	 kl mean: 8.344160079956055 	 loss mean: 90.19369506835938
nll mean: 81.33033752441406 	 kl mean: 8.344160079956055 	 loss mean: 89.67449951171875
nll mean: 82.0098876953125 	 kl mean: 8.344160079956055 	 loss mean: 90.35404968261719
nll mean: 81.82655334472656 	 kl mean: 8.344160079956055 	 loss mean: 90.17071533203125



                                               
100%|██████████| 10/10 [00:00<00:00, 21.67it/s][A
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 71%|███████   | 27/38 [00:16<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s]
 30%|███       | 3/10 [00:00<00:00, 21.91it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A

nll mean: 81.95103454589844 	 kl mean: 8.344160079956055 	 loss mean: 90.29520416259766
nll mean: 108.74113464355469 	 kl mean: 8.208187103271484 	 loss mean: 116.94932556152344
nll mean: 108.80899047851562 	 kl mean: 8.208187103271484 	 loss mean: 117.01718139648438
nll mean: 108.89553833007812 	 kl mean: 8.208187103271484 	 loss mean: 117.10372924804688
nll mean: 108.78279876708984 	 kl mean: 8.208187103271484 	 loss mean: 116.99098205566406



                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
                                               
 71%|███████   | 27/38 [00:17<00:06,  1.73it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.77it/s][A

nll mean: 109.41816711425781 	 kl mean: 8.208187103271484 	 loss mean: 117.62635803222656
nll mean: 108.8897705078125 	 kl mean: 8.208187103271484 	 loss mean: 117.09796142578125
nll mean: 108.76997375488281 	 kl mean: 8.208187103271484 	 loss mean: 116.97815704345703
nll mean: 108.20539855957031 	 kl mean: 8.208187103271484 	 loss mean: 116.41358947753906
nll mean: 108.37910461425781 	 kl mean: 8.208187103271484 	 loss mean: 116.58729553222656



                                               
100%|██████████| 10/10 [00:00<00:00, 21.59it/s][A
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s]
 20%|██        | 2/10 [00:00<00:00, 12.47it/s][A

nll mean: 108.59391784667969 	 kl mean: 8.208187103271484 	 loss mean: 116.80209350585938
nll mean: 120.66326904296875 	 kl mean: 9.305398941040039 	 loss mean: 129.96865844726562
nll mean: 120.37137603759766 	 kl mean: 9.305398941040039 	 loss mean: 129.67678833007812



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.53it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A

nll mean: 120.7135009765625 	 kl mean: 9.305398941040039 	 loss mean: 130.01889038085938
nll mean: 120.7166976928711 	 kl mean: 9.305398941040039 	 loss mean: 130.0220947265625
nll mean: 120.6269302368164 	 kl mean: 9.305398941040039 	 loss mean: 129.9323272705078



                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.62it/s][A
                                               
 74%|███████▎  | 28/38 [00:17<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.45it/s][A

nll mean: 121.19017028808594 	 kl mean: 9.305398941040039 	 loss mean: 130.49557495117188
nll mean: 120.78298950195312 	 kl mean: 9.305398941040039 	 loss mean: 130.08837890625
nll mean: 120.61481475830078 	 kl mean: 9.305398941040039 	 loss mean: 129.9202117919922



                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s][A
                                               
 74%|███████▎  | 28/38 [00:18<00:05,  1.83it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]

nll mean: 120.35317993164062 	 kl mean: 9.305398941040039 	 loss mean: 129.65858459472656
nll mean: 120.20919799804688 	 kl mean: 9.305398941040039 	 loss mean: 129.5146026611328
nll mean: 63.30455017089844 	 kl mean: 10.251903533935547 	 loss mean: 73.55644989013672



                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s]
 20%|██        | 2/10 [00:00<00:00, 10.08it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.99it/s][A


nll mean: 62.20762634277344 	 kl mean: 10.251903533935547 	 loss mean: 72.45953369140625
nll mean: 63.31315612792969 	 kl mean: 10.251903533935547 	 loss mean: 73.5650634765625


                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A
 50%|█████     | 5/10 [00:00<00:00, 10.04it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A

nll mean: 63.50942611694336 	 kl mean: 10.251903533935547 	 loss mean: 73.76132202148438
nll mean: 62.33061218261719 	 kl mean: 10.251903533935547 	 loss mean: 72.58250427246094
nll mean: 63.1827507019043 	 kl mean: 10.251903533935547 	 loss mean: 73.43465423583984



 60%|██████    | 6/10 [00:00<00:00,  9.99it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A
                                               
 76%|███████▋  | 29/38 [00:18<00:05,  1.60it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.10it/s][A
                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s][A

nll mean: 62.73846435546875 	 kl mean: 10.251903533935547 	 loss mean: 72.99037170410156
nll mean: 62.32941436767578 	 kl mean: 10.251903533935547 	 loss mean: 72.5813217163086
nll mean: 62.32474136352539 	 kl mean: 10.251903533935547 	 loss mean: 72.57664489746094



                                               
 76%|███████▋  | 29/38 [00:19<00:05,  1.60it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.12it/s][A
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s]
 20%|██        | 2/10 [00:00<00:00, 12.73it/s][A

nll mean: 62.83123779296875 	 kl mean: 10.251903533935547 	 loss mean: 73.08314514160156
nll mean: 105.8995590209961 	 kl mean: 9.634160041809082 	 loss mean: 115.53372192382812
nll mean: 105.1291275024414 	 kl mean: 9.634160041809082 	 loss mean: 114.7632827758789



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.57it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A

nll mean: 104.96634674072266 	 kl mean: 9.634160041809082 	 loss mean: 114.60050964355469
nll mean: 105.31685638427734 	 kl mean: 9.634160041809082 	 loss mean: 114.95101165771484
nll mean: 106.1646728515625 	 kl mean: 9.634160041809082 	 loss mean: 115.798828125



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.46it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.46it/s][A

nll mean: 105.81012725830078 	 kl mean: 9.634160041809082 	 loss mean: 115.44429016113281
nll mean: 105.70967102050781 	 kl mean: 9.634160041809082 	 loss mean: 115.34383392333984
nll mean: 105.36469268798828 	 kl mean: 9.634160041809082 	 loss mean: 114.99885559082031



                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
                                               
 79%|███████▉  | 30/38 [00:19<00:05,  1.36it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.42it/s][A
 82%|████████▏ | 31/38 [00:19<00:05,  1.32it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]

nll mean: 105.50191497802734 	 kl mean: 9.634160041809082 	 loss mean: 115.13607025146484
nll mean: 105.42298889160156 	 kl mean: 9.634160041809082 	 loss mean: 115.05714416503906
nll mean: 139.52749633789062 	 kl mean: 9.889022827148438 	 loss mean: 149.41651916503906



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s]
 20%|██        | 2/10 [00:00<00:00, 10.00it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 30%|███       | 3/10 [00:00<00:00,  9.97it/s][A

nll mean: 139.7360076904297 	 kl mean: 9.889022827148438 	 loss mean: 149.62503051757812
nll mean: 139.90322875976562 	 kl mean: 9.889022827148438 	 loss mean: 149.792236328125



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 40%|████      | 4/10 [00:00<00:00,  9.91it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 50%|█████     | 5/10 [00:00<00:00,  9.86it/s][A

nll mean: 139.56643676757812 	 kl mean: 9.889022827148438 	 loss mean: 149.45545959472656
nll mean: 140.49746704101562 	 kl mean: 9.889022827148438 	 loss mean: 150.38648986816406



                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 60%|██████    | 6/10 [00:00<00:00,  9.83it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 70%|███████   | 7/10 [00:00<00:00,  9.85it/s][A
[A                                           

nll mean: 139.52914428710938 	 kl mean: 9.889022827148438 	 loss mean: 149.41818237304688
nll mean: 139.2542266845703 	 kl mean: 9.889022827148438 	 loss mean: 149.14324951171875


                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 80%|████████  | 8/10 [00:00<00:00,  9.87it/s][A
                                               
 82%|████████▏ | 31/38 [00:20<00:05,  1.32it/s][A
 90%|█████████ | 9/10 [00:00<00:00,  9.90it/s][A

nll mean: 139.21986389160156 	 kl mean: 9.889022827148438 	 loss mean: 149.10890197753906
nll mean: 139.15008544921875 	 kl mean: 9.889022827148438 	 loss mean: 149.03912353515625



                                               
 82%|████████▏ | 31/38 [00:21<00:05,  1.32it/s][A
100%|██████████| 10/10 [00:01<00:00,  9.83it/s][A
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
 30%|███       | 3/10 [00:00<00:00, 25.97it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 30%|███       | 3/10 [00:00<00:00, 25.97it/s]

nll mean: 139.50906372070312 	 kl mean: 9.889022827148438 	 loss mean: 149.39808654785156
nll mean: 63.18902587890625 	 kl mean: 8.543086051940918 	 loss mean: 71.73210906982422
nll mean: 63.523582458496094 	 kl mean: 8.543086051940918 	 loss mean: 72.06668090820312
nll mean: 63.53467559814453 	 kl mean: 8.543086051940918 	 loss mean: 72.0777587890625
nll mean: 62.90361785888672 	 kl mean: 8.543086051940918 	 loss mean: 71.44670867919922
nll mean: 62.671775817871094 	 kl mean: 8.543086051940918 	 loss mean: 71.21485900878906


 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s]
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
 60%|██████    | 6/10 [00:00<00:00, 25.68it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
                                               
 84%|████████▍ | 32/38 [00:21<00:05,  1.20it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 25.67it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 25.49it/s][A
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 63.33992004394531 	 kl mean: 8.543086051940918 	 loss mean: 71.88300323486328
nll mean: 63.382225036621094 	 kl mean: 8.543086051940918 	 loss mean: 71.92530822753906
nll mean: 63.344966888427734 	 kl mean: 8.543086051940918 	 loss mean: 71.88805389404297
nll mean: 63.055702209472656 	 kl mean: 8.543086051940918 	 loss mean: 71.59879302978516
nll mean: 63.250205993652344 	 kl mean: 8.543086051940918 	 loss mean: 71.79328918457031



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s]
 30%|███       | 3/10 [00:00<00:00, 21.36it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A

nll mean: 118.88893127441406 	 kl mean: 8.183547973632812 	 loss mean: 127.07247924804688
nll mean: 119.24819946289062 	 kl mean: 8.183547973632812 	 loss mean: 127.43174743652344
nll mean: 119.51341247558594 	 kl mean: 8.183547973632812 	 loss mean: 127.69696807861328
nll mean: 119.43643951416016 	 kl mean: 8.183547973632812 	 loss mean: 127.61997985839844
nll mean: 118.97055053710938 	 kl mean: 8.183547973632812 	 loss mean: 127.15409851074219



                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.29it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
                                               
 87%|████████▋ | 33/38 [00:21<00:03,  1.42it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.27it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.22it/s][A
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A

nll mean: 119.05348205566406 	 kl mean: 8.183547973632812 	 loss mean: 127.23703002929688
nll mean: 120.1036376953125 	 kl mean: 8.183547973632812 	 loss mean: 128.28720092773438
nll mean: 119.23263549804688 	 kl mean: 8.183547973632812 	 loss mean: 127.41618347167969
nll mean: 119.40951538085938 	 kl mean: 8.183547973632812 	 loss mean: 127.59306335449219
nll mean: 119.42803955078125 	 kl mean: 8.183547973632812 	 loss mean: 127.61158752441406



                                               
 89%|████████▉ | 34/38 [00:21<00:02,  1.58it/s]
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s]
 20%|██        | 2/10 [00:00<00:00, 12.81it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A

nll mean: 120.23808288574219 	 kl mean: 9.529041290283203 	 loss mean: 129.76712036132812
nll mean: 120.15451049804688 	 kl mean: 9.529041290283203 	 loss mean: 129.6835479736328
nll mean: 120.18936157226562 	 kl mean: 9.529041290283203 	 loss mean: 129.71841430664062



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 40%|████      | 4/10 [00:00<00:00, 12.76it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 60%|██████    | 6/10 [00:00<00:00, 12.59it/s][A

nll mean: 120.13436889648438 	 kl mean: 9.529041290283203 	 loss mean: 129.6634063720703
nll mean: 120.9901123046875 	 kl mean: 9.529041290283203 	 loss mean: 130.51914978027344
nll mean: 120.31550598144531 	 kl mean: 9.529041290283203 	 loss mean: 129.84454345703125



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
 80%|████████  | 8/10 [00:00<00:00, 12.49it/s][A
                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A

nll mean: 120.45280456542969 	 kl mean: 9.529041290283203 	 loss mean: 129.9818572998047
nll mean: 120.44972229003906 	 kl mean: 9.529041290283203 	 loss mean: 129.978759765625
nll mean: 120.77516174316406 	 kl mean: 9.529041290283203 	 loss mean: 130.30419921875



                                               
 89%|████████▉ | 34/38 [00:22<00:02,  1.58it/s][A
100%|██████████| 10/10 [00:00<00:00, 12.45it/s][A
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s]
 20%|██        | 2/10 [00:00<00:00, 10.70it/s][A

nll mean: 120.38189697265625 	 kl mean: 9.529041290283203 	 loss mean: 129.9109344482422
nll mean: 114.13948822021484 	 kl mean: 8.800617218017578 	 loss mean: 122.94010162353516
nll mean: 113.45616912841797 	 kl mean: 8.800617218017578 	 loss mean: 122.25679016113281



                                               
 92%|█████████▏| 35/38 [00:22<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 40%|████      | 4/10 [00:00<00:00, 10.67it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A

nll mean: 113.50926208496094 	 kl mean: 8.800617218017578 	 loss mean: 122.30987548828125
nll mean: 113.93722534179688 	 kl mean: 8.800617218017578 	 loss mean: 122.73783874511719
nll mean: 113.44026947021484 	 kl mean: 8.800617218017578 	 loss mean: 122.24089050292969



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 60%|██████    | 6/10 [00:00<00:00, 10.67it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
 80%|████████  | 8/10 [00:00<00:00, 10.63it/s][A

nll mean: 113.3631362915039 	 kl mean: 8.800617218017578 	 loss mean: 122.16374969482422
nll mean: 113.51099395751953 	 kl mean: 8.800617218017578 	 loss mean: 122.31161499023438
nll mean: 113.66567993164062 	 kl mean: 8.800617218017578 	 loss mean: 122.46630096435547



                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
                                               
 92%|█████████▏| 35/38 [00:23<00:02,  1.46it/s][A
100%|██████████| 10/10 [00:00<00:00, 10.61it/s][A
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]

nll mean: 113.08512115478516 	 kl mean: 8.800617218017578 	 loss mean: 121.8857421875
nll mean: 113.99153137207031 	 kl mean: 8.800617218017578 	 loss mean: 122.79215240478516
nll mean: 111.13726806640625 	 kl mean: 9.077619552612305 	 loss mean: 120.21488189697266
nll mean: 111.69073486328125 	 kl mean: 9.077619552612305 	 loss mean: 120.76834869384766



                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s]
 30%|███       | 3/10 [00:00<00:00, 21.27it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A
 60%|██████    | 6/10 [00:00<00:00, 21.30it/s][A
                                               
 95%|█████████▍| 36/38 [00:23<00:01,  1.31it/s][A

nll mean: 111.18386840820312 	 kl mean: 9.077619552612305 	 loss mean: 120.26148223876953
nll mean: 111.56610107421875 	 kl mean: 9.077619552612305 	 loss mean: 120.64372253417969
nll mean: 111.880859375 	 kl mean: 9.077619552612305 	 loss mean: 120.95848083496094
nll mean: 111.89889526367188 	 kl mean: 9.077619552612305 	 loss mean: 120.97650909423828
nll mean: 111.51011657714844 	 kl mean: 9.077619552612305 	 loss mean: 120.58773803710938



                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A
                                               
 95%|█████████▍| 36/38 [00:24<00:01,  1.31it/s][A
 90%|█████████ | 9/10 [00:00<00:00, 21.21it/s][A
                                               
100%|██████████| 10/10 [00:00<00:00, 21.24it/s][A
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
  0%|          | 0/10 [00:00<?, ?it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]

nll mean: 111.8063735961914 	 kl mean: 9.077619552612305 	 loss mean: 120.88400268554688
nll mean: 112.31680297851562 	 kl mean: 9.077619552612305 	 loss mean: 121.39442443847656
nll mean: 111.49262237548828 	 kl mean: 9.077619552612305 	 loss mean: 120.57024383544922
nll mean: 86.4000473022461 	 kl mean: 10.26272964477539 	 loss mean: 96.66278076171875
nll mean: 85.66909790039062 	 kl mean: 10.26272964477539 	 loss mean: 95.93183898925781
nll mean: 85.55380249023438 	 kl mean: 10.26272964477539 	 loss mean: 95.8165283203125



                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s]
 40%|████      | 4/10 [00:00<00:00, 30.29it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
 80%|████████  | 8/10 [00:00<00:00, 30.31it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A
                                               
 97%|█████████▋| 37/38 [00:24<00:00,  1.48it/s][A

nll mean: 85.82894897460938 	 kl mean: 10.26272964477539 	 loss mean: 96.0916748046875
nll mean: 84.88636016845703 	 kl mean: 10.26272964477539 	 loss mean: 95.14909362792969
nll mean: 85.14442443847656 	 kl mean: 10.26272964477539 	 loss mean: 95.40715789794922
nll mean: 85.46232604980469 	 kl mean: 10.26272964477539 	 loss mean: 95.72505187988281
nll mean: 86.04447937011719 	 kl mean: 10.26272964477539 	 loss mean: 96.30721282958984
nll mean: 84.94355773925781 	 kl mean: 10.26272964477539 	 loss mean: 95.20629119873047
nll mean: 86.26445007324219 	 kl mean: 10.26272964477539 	 loss mean: 96.52718353271484


100%|██████████| 10/10 [00:00<00:00, 30.18it/s]
100%|██████████| 38/38 [00:24<00:00,  1.55it/s]


Approximate NLL:
tensor(121.6202, device='cuda:0')
Approximate KL:
tensor(9.1793, device='cuda:0')
Testing took 0:00:25.444497


In [25]:
# Show the per-run NLL and KL estimates gathered for the vanilla models.
print(f"{vanilla_nlls} {vanilla_kls}")

[tensor(126.9970, device='cuda:0'), tensor(127.1339, device='cuda:0'), tensor(127.0737, device='cuda:0'), tensor(126.7274, device='cuda:0')] [tensor(0.0486, device='cuda:0'), tensor(0.0453, device='cuda:0'), tensor(0.0573, device='cuda:0'), tensor(0.0670, device='cuda:0')]


In [26]:
# Show the per-run NLL and KL estimates gathered for the word-dropout models.
print(f"{wd_nlls} {wd_kls}")

[tensor(126.3611, device='cuda:0'), tensor(127.2960, device='cuda:0'), tensor(126.4909, device='cuda:0'), tensor(126.9019, device='cuda:0')] [tensor(1.2080, device='cuda:0'), tensor(1.0724, device='cuda:0'), tensor(1.4329, device='cuda:0'), tensor(1.1597, device='cuda:0')]


In [27]:
# Show the per-run NLL and KL estimates gathered for the free-bits models.
print(f"{fb_nlls} {fb_kls}")

[tensor(121.0295, device='cuda:0'), tensor(120.7947, device='cuda:0'), tensor(120.9791, device='cuda:0'), tensor(121.1578, device='cuda:0')] [tensor(8.1792, device='cuda:0'), tensor(8.3366, device='cuda:0'), tensor(8.2716, device='cuda:0'), tensor(8.2359, device='cuda:0')]


In [28]:
# Show the per-run NLL and KL estimates gathered for the MDR models.
print(f"{mdr_nlls} {mdr_kls}")

[tensor(119.7677, device='cuda:0'), tensor(119.8687, device='cuda:0'), tensor(120.0548, device='cuda:0'), tensor(119.5421, device='cuda:0')] [tensor(9.7394, device='cuda:0'), tensor(9.5362, device='cuda:0'), tensor(9.7923, device='cuda:0'), tensor(9.5691, device='cuda:0')]


In [29]:
# Show the per-run NLL and KL estimates for word dropout combined with free bits.
print(f"{wd_fb_nlls} {wd_fb_kls}")

[tensor(121.8104, device='cuda:0'), tensor(121.3209, device='cuda:0'), tensor(121.2213, device='cuda:0'), tensor(121.8890, device='cuda:0')] [tensor(8.4971, device='cuda:0'), tensor(8.7278, device='cuda:0'), tensor(8.8820, device='cuda:0'), tensor(9.1538, device='cuda:0')]


In [30]:
# Show the per-run NLL and KL estimates for word dropout combined with MDR.
print(f"{wd_mdr_nlls} {wd_mdr_kls}")

[tensor(120.9362, device='cuda:0'), tensor(121.1414, device='cuda:0'), tensor(120.5020, device='cuda:0'), tensor(121.6202, device='cuda:0')] [tensor(8.9841, device='cuda:0'), tensor(9.4737, device='cuda:0'), tensor(9.8161, device='cuda:0'), tensor(9.1793, device='cuda:0')]


# Results

In [31]:
# Gather each experiment's per-run NLL estimates into a single tensor,
# keyed by the human-readable experiment label.
all_results = {
    label: torch.tensor(per_run_nlls)
    for label, per_run_nlls in (
        ("Vanilla", vanilla_nlls),
        ("Word dropout", wd_nlls),
        ("Free Bits", fb_nlls),
        ("MDR", mdr_nlls),
        ("Word dropout & Free Bits", wd_fb_nlls),
        ("Word dropout & MDR", wd_mdr_nlls),
    )
}

In [32]:
# Report the mean and standard deviation of the NLL estimates per experiment.
for name in all_results:
    # torch.std_mean hands back the pair in (std, mean) order.
    std, mean = torch.std_mean(all_results[name])
    print(f"{name: >30} approximated NLL: \t {mean} \t +- {std}")

                       Vanilla approximated NLL: 	 126.9830093383789 	 +- 0.17940175533294678
                  Word dropout approximated NLL: 	 126.76248168945312 	 +- 0.4238397181034088
                     Free Bits approximated NLL: 	 120.9902572631836 	 +- 0.15050916373729706
                           MDR approximated NLL: 	 119.80831146240234 	 +- 0.21363131701946259
      Word dropout & Free Bits approximated NLL: 	 121.56041717529297 	 +- 0.33803650736808777
            Word dropout & MDR approximated NLL: 	 121.04994201660156 	 +- 0.4643072783946991


In [33]:
# Gather each experiment's per-run KL estimates into a single tensor,
# keyed by the human-readable experiment label.
# NOTE: this rebinds `all_results`, replacing the NLL tensors built earlier.
all_results = {
    label: torch.tensor(per_run_kls)
    for label, per_run_kls in (
        ("Vanilla", vanilla_kls),
        ("Word dropout", wd_kls),
        ("Free Bits", fb_kls),
        ("MDR", mdr_kls),
        ("Word dropout & Free Bits", wd_fb_kls),
        ("Word dropout & MDR", wd_mdr_kls),
    )
}

In [35]:
# Report the mean and standard deviation of the KL estimates per experiment.
for name in all_results:
    # torch.std_mean hands back the pair in (std, mean) order.
    std, mean = torch.std_mean(all_results[name])
    print(f"{name: >30} approximated KL: \t {mean} \t +- {std}")

                       Vanilla approximated KL: 	 0.054543379694223404 	 +- 0.00971465464681387
                  Word dropout approximated KL: 	 1.21824312210083 	 +- 0.15374356508255005
                     Free Bits approximated KL: 	 8.255844116210938 	 +- 0.06594689935445786
                           MDR approximated KL: 	 9.65927505493164 	 +- 0.1257069706916809
      Word dropout & Free Bits approximated KL: 	 8.815167427062988 	 +- 0.2756330668926239
            Word dropout & MDR approximated KL: 	 9.36330509185791 	 +- 0.36282771825790405
