In [1]:
!pip install neuralforecast

Defaulting to user installation because normal site-packages is not writeable

[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m A new release of pip is available: [0m[31;49m23.0.1[0m[39;49m -> [0m[32;49m23.1.2[0m
[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m To update, run: [0m[32;49mpython3 -m pip install --upgrade pip[0m


In [3]:
import logging
import os
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from neuralforecast import NeuralForecast
from neuralforecast.auto import (
    AutoDilatedRNN,
    AutoGRU,
    AutoLSTM,
    AutoMLP,
    AutoNBEATSx,
    AutoNHITS,
    AutoRNN,
    AutoTCN,
)
from ray import tune

  from pandas.core.computation.check import NUMEXPR_INSTALLED
  warn(f"Failed to load image Python extension: {e}")


In [4]:
def load_data(file_path):
    """Load one vintage CSV and arrange it with the key columns first.

    The source is read exactly once, so paths and file-like objects both
    work. ``year_quarter`` is renamed to ``ds`` and ``GDPC1`` to ``y``; a
    constant ``unique_id`` of 1.0 is added; ``ds`` is parsed to datetimes and
    moved back by one day.

    Args:
        file_path: Anything accepted by ``pandas.read_csv`` (path or buffer).

    Returns:
        pandas.DataFrame whose columns are ``unique_id``, ``ds``, ``y``
        followed by every remaining column in its original order.
    """
    key_columns = ["unique_id", "ds", "y"]

    raw = pd.read_csv(file_path)
    df = (raw
          .rename(columns={"year_quarter": "ds", "GDPC1": "y"})
          .assign(unique_id=np.ones(len(raw)),
                  # Parse the date and step back one day (presumably turning a
                  # period-start stamp into the preceding period end -- confirm
                  # against the data files).
                  ds=lambda frame: pd.to_datetime(frame["ds"]) - pd.Timedelta(days=1)))

    columns_order = key_columns + \
        [col for col in df.columns if col not in key_columns]
    return df[columns_order]


def separate_covariates(df, point_in_time):
    """Split the covariate columns into "past" and "future" groups.

    Covariates are all columns other than ``unique_id``, ``ds`` and ``y``.
    A covariate is classed as *past* when it has at least one missing value
    among the rows whose index label is ``>= point_in_time - 1``; otherwise
    it is classed as *future*.

    Args:
        df: Frame containing ``unique_id``, ``ds``, ``y`` and the covariates.
        point_in_time: Index label marking the cut-off, or ``None`` to skip
            the split and treat every covariate as a past covariate.

    Returns:
        Tuple ``(past_covariates, future_covariates)`` of column subsets of
        ``df``; rows are never dropped.
    """
    covariates = df.drop(columns=["unique_id", "ds", "y"])

    # Test for None explicitly: 0 is a valid index label and must not be
    # mistaken for "no cut-off supplied".
    if point_in_time is None:
        return df[covariates.columns], df[[]]

    recent_rows = covariates.loc[covariates.index >= point_in_time - 1]
    # One boolean per covariate column: True when the recent window has a gap.
    has_gap = recent_rows.isnull().any().to_numpy(dtype=bool)

    past_covariates = df[covariates.columns[has_gap]]
    future_covariates = df[covariates.columns[~has_gap]]

    return past_covariates, future_covariates


def impute_missing_values_interpolate(data, method='linear'):
    """Return a copy of ``data`` with missing values filled in.

    Gaps are first back-filled (each missing value takes the next valid
    observation below it), then whatever is still missing is passed through
    ``interpolate``. Because the back-fill runs first, only values with no
    later observation are left for the interpolation step. The input object
    is not modified.

    Args:
        data: pandas DataFrame (or Series) to impute.
        method: Interpolation method forwarded to ``interpolate``.

    Returns:
        A new object of the same shape with the gaps filled.
    """
    # .bfill() returns a new object and replaces the deprecated
    # fillna(method='bfill', inplace=True) spelling.
    back_filled = data.bfill()
    return back_filled.interpolate(method=method)


### Different vintages ###


def _common_search_space(hist_exog, futr_exog):
    """Build the Ray Tune search-space entries shared by all three models."""
    return {
        "input_size": tune.choice([2, 4, 8, 12, 20]),  # think about this tuning choice
        "learning_rate": tune.loguniform(1e-4, 1e-1),
        "scaler_type": tune.choice(["robust"]),
        "batch_size": tune.choice([32, 64, 128, 256]),
        "windows_batch_size": tune.choice([128, 256, 512, 1024]),
        # Single-option choices: the exogenous column lists are fixed for a
        # given vintage and are not actually searched over.
        "hist_exog_list": tune.choice([hist_exog]),
        "futr_exog_list": tune.choice([futr_exog]),
        "max_steps": tune.choice([500, 1000]),
        "random_seed": tune.randint(1, 20),
    }


def _mlp_search_space(hist_exog, futr_exog):
    """Shared search space plus the MLP width/depth entries."""
    space = _common_search_space(hist_exog, futr_exog)
    space.update({
        "hidden_size": tune.choice([256, 512, 1024]),
        "num_layers": tune.randint(2, 6),
    })
    return space


def _nhits_search_space(hist_exog, futr_exog):
    """Shared search space plus the NHITS pooling/downsampling entries."""
    space = _common_search_space(hist_exog, futr_exog)
    space.update({
        "n_pool_kernel_size": tune.choice(
            [[2, 2, 1], 3 * [1], 3 * [2], 3 * [4], [8, 4, 1], [16, 8, 1]]
        ),
        "n_freq_downsample": tune.choice(
            [
                [168, 24, 1],
                [24, 12, 1],
                [180, 60, 1],
                [60, 8, 1],
                [40, 20, 1],
                [1, 1, 1],
            ]
        ),
    })
    return space


def forecast_vintage(vintage_file, horizon=4, num_samples=30):
    """Tune and fit AutoMLP, AutoNBEATSx and AutoNHITS on one vintage file.

    Steps:
      1. Load the vintage with ``load_data``.
      2. Split the covariates into past/future groups with
         ``separate_covariates``, using the second-to-last index label as the
         cut-off, and impute each group.
      3. Train on every row except the last; the last row's future
         covariates (un-imputed) form ``futr_df`` for prediction.
      4. Fit all models through ``NeuralForecast`` at quarterly frequency and
         predict.

    Args:
        vintage_file: Path of the vintage CSV; also used as the key of the
            returned ``results`` dict.
        horizon: Forecast horizon ``h`` handed to every model.
        num_samples: Number of hyper-parameter samples per model (default 30,
            the value previously hard-coded).

    Returns:
        Tuple ``(Y_hat_df, results)``: the prediction frame after
        ``reset_index()``, and a dict mapping ``vintage_file`` to the values
        of the prediction frame's second column as a list.
    """
    results = {}

    df = load_data(vintage_file)
    target_df = df[["unique_id", "ds", "y"]]

    point_in_time = df.index[-2]
    past_covariates, future_covariates = separate_covariates(
        df, point_in_time)

    df_pc = impute_missing_values_interpolate(past_covariates)
    df_fc = impute_missing_values_interpolate(future_covariates)

    pcc_list = past_covariates.columns.tolist()
    fcc_list = future_covariates.columns.tolist()

    # Training frame: target plus imputed covariates, last row held back.
    train_df = (target_df
                .merge(df_fc, left_index=True, right_index=True)
                .merge(df_pc, left_index=True, right_index=True)
                .iloc[:-1])

    # Future frame: only the held-back last row, without the target.
    futr_df = (target_df
               .merge(future_covariates, left_index=True, right_index=True)
               .drop(columns="y")
               .iloc[-1:])

    # Reference the classes directly instead of looking them up by string in
    # globals(): a missing import then surfaces as an ordinary NameError.
    model_specs = [
        ("AutoMLP", AutoMLP, _mlp_search_space(pcc_list, fcc_list)),
        ("AutoNBEATSx", AutoNBEATSx, _common_search_space(pcc_list, fcc_list)),
        ("AutoNHITS", AutoNHITS, _nhits_search_space(pcc_list, fcc_list)),
    ]

    model_instances = []
    for model_name, model_class, config in model_specs:
        print(f"Running model: {model_name}")
        model_instances.append(
            model_class(h=horizon, num_samples=num_samples, config=config))

    nf = NeuralForecast(models=model_instances, freq='Q')
    nf.fit(df=train_df)

    Y_hat_df = nf.predict(futr_df=futr_df)
    # Positional pick of the second column -- presumably the first model's
    # forecasts when column 0 is ``ds``; TODO confirm for the installed
    # neuralforecast version.
    forecast_value = Y_hat_df.iloc[:, 1].values.tolist()

    results[vintage_file] = forecast_value

    Y_hat_df = Y_hat_df.reset_index()

    return Y_hat_df, results

In [5]:
# Accumulators that the vintage loop fills in.
results = {}
comparison = pd.DataFrame()

# One CSV per monthly vintage, from 2018-05 through 2023-02 inclusive.
vintage_files = [
    f'data/vintage_{year}_{month:02d}.csv'
    for year in range(2018, 2024)
    for month in range(1, 13)
    if (2018, 5) <= (year, month) <= (2023, 2)
]

In [None]:

total_vintages = len(vintage_files)

start_time_whole = time.time()

def write_to_csv(df, block_number):
    """Write ``df`` to ``results/mlp_results_<block_number>.csv`` without the index.

    The target directory is created when missing, so a long forecasting run
    is not lost to a missing output folder.
    """
    out_path = f'results/mlp_results_{block_number}.csv'
    os.makedirs(os.path.dirname(out_path), exist_ok=True)
    df.to_csv(out_path, index=False)

# Vintages are processed in blocks; after each block the cumulative
# comparison frame is written out as a checkpoint.
block_size = 1
for i in range(0, len(vintage_files), block_size):
    block = vintage_files[i:i+block_size]
    block_number = i // block_size + 1
    for j, vintage_file in enumerate(block):
        # len(block) rather than block_size: the final block may be shorter.
        print(f"Processing {vintage_file} ({j+1}/{len(block)}) in block {block_number}")
        vintage_comparison, vintage_results = forecast_vintage(vintage_file)

        # Tag each forecast row with the vintage it came from (file stem).
        vintage_file_name = os.path.basename(vintage_file)
        vintage_file_name = os.path.splitext(vintage_file_name)[0]
        vintage_comparison = vintage_comparison.assign(vintage_file = vintage_file_name)

        comparison = pd.concat([comparison, vintage_comparison], ignore_index=True)

        results.update(vintage_results)

    write_to_csv(comparison, block_number)



end_time_whole = time.time()

time_diff = end_time_whole - start_time_whole
hours, remainder = divmod(time_diff, 3600)
minutes, seconds = divmod(remainder, 60)

print(f"Time taken to run the code: {int(hours)} hour(s), {int(minutes)} minute(s), and {seconds:.2f} seconds")

[2m[36m(pid=701377)[0m   from pandas.core.computation.check import NUMEXPR_INSTALLED
[2m[36m(pid=701377)[0m   warn(f"Failed to load image Python extension: {e}")
[2m[36m(train_tune pid=701377)[0m Global seed set to 17
[2m[36m(train_tune pid=701377)[0m --------------------------------------------------------------------------
[2m[36m(train_tune pid=701377)[0m detected:
[2m[36m(train_tune pid=701377)[0m 
[2m[36m(train_tune pid=701377)[0m   Local host:            152-67-225-75
[2m[36m(train_tune pid=701377)[0m   Device name:           mlx5_0
[2m[36m(train_tune pid=701377)[0m   Device vendor ID:      0x02c9
[2m[36m(train_tune pid=701377)[0m   Device vendor part ID: 4126
[2m[36m(train_tune pid=701377)[0m 
[2m[36m(train_tune pid=701377)[0m Default device parameters will be used, which may result in lower
[2m[36m(train_tune pid=701377)[0m performance.  You can edit any of the files specified by the
[2m[36m(train_tune pid=701377)[0m btl_openib_device_p

Sanity Checking DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/1 [00:00<?, ?it/s]                             
Epoch 13:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.200, train_loss_epoch=1.200]         
Epoch 13: 100%|██████████| 1/1 [00:00<00:00, 153.48it/s, v_num=0, train_loss_step=0.846, train_loss_epoch=0.846]
Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.846, train_loss_epoch=0.846]         
Epoch 27: 100%|██████████| 1/1 [00:00<00:00, 139.81it/s, v_num=0, train_loss_step=0.549, train_loss_epoch=0.549]
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.549, train_loss_epoch=0.549]         
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.337, train_loss_epoch=0.337]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.718, train_loss_epoch=0.718]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_lo

[2m[36m(train_tune pid=701377)[0m Global seed set to 18


Epoch 8:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.210, train_loss_epoch=1.210]         
Epoch 9:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.210, train_loss_epoch=1.210]
Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.340, train_loss_epoch=2.340]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.538, train_loss_epoch=0.538]         
Epoch 51: 100%|██████████| 1/1 [00:00<00:00, 159.47it/s, v_num=0, train_loss_step=0.874, train_loss_epoch=0.874]
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.874, train_loss_epoch=0.874]         
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.416, train_loss_epoch=0.416]         
Epoch 80:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.110, train_loss_epoch=1.110]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.335, train_loss_epoch=0.335]    

[2m[36m(train_tune pid=701377)[0m Global seed set to 8


Epoch 26: 100%|██████████| 1/1 [00:00<00:00, 159.87it/s, v_num=0, train_loss_step=1.600, train_loss_epoch=1.600]
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.600, train_loss_epoch=1.600]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.440, train_loss_epoch=1.440]         
Epoch 41: 100%|██████████| 1/1 [00:00<00:00, 162.46it/s, v_num=0, train_loss_step=0.457, train_loss_epoch=0.457]
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.457, train_loss_epoch=0.457]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.040]         
Epoch 56: 100%|██████████| 1/1 [00:00<00:00, 131.26it/s, v_num=0, train_loss_step=0.577, train_loss_epoch=0.577]
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.577, train_loss_epoch=0.577]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.170, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 9


Epoch 21: 100%|██████████| 1/1 [00:00<00:00, 149.55it/s, v_num=0, train_loss_step=5.520, train_loss_epoch=7.860]
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.520, train_loss_epoch=5.520]         
Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.500, train_loss_epoch=8.500]         
Epoch 48: 100%|██████████| 1/1 [00:00<00:00, 140.02it/s, v_num=0, train_loss_step=1.830, train_loss_epoch=1.830]
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.830, train_loss_epoch=1.830]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.150, train_loss_epoch=3.150]         
Epoch 75:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.370, train_loss_epoch=8.370]         
Epoch 75: 100%|██████████| 1/1 [00:00<00:00, 141.45it/s, v_num=0, train_loss_step=1.520, train_loss_epoch=1.520]
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.520, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 12


Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]         
Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=20.90, train_loss_epoch=20.90]         
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.510, train_loss_epoch=2.510]         
Epoch 63: 100%|██████████| 1/1 [00:00<00:00, 138.49it/s, v_num=0, train_loss_step=37.00, train_loss_epoch=37.00]
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=37.00, train_loss_epoch=37.00]         
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.450, train_loss_epoch=1.450]         
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=14.40, train_loss_epoch=14.40]         
Epoch 93:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.790, train_loss_epoch=1.790]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 162.94it/s, v_num=0, train_loss_step=6.280, train_l

[2m[36m(train_tune pid=701377)[0m Global seed set to 1


Epoch 10:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.725, train_loss_epoch=0.725]        
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.330, train_loss_epoch=1.330]         
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.270, train_loss_epoch=1.270]         
Epoch 25:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.270, train_loss_epoch=1.270]
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.911, train_loss_epoch=0.911]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.709, train_loss_epoch=0.709]         
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.785, train_loss_epoch=0.785]         
Epoch 68: 100%|██████████| 1/1 [00:00<00:00, 170.49it/s, v_num=0, train_loss_step=0.785, train_loss_epoch=0.785]
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.090, train_loss_epoch=1.090]   

[2m[36m(train_tune pid=701377)[0m Global seed set to 2


Epoch 3:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.890, train_loss_epoch=1.890]        
Epoch 9:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.170, train_loss_epoch=1.170]        
Epoch 15:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.160, train_loss_epoch=1.160]         
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.943, train_loss_epoch=0.943]        
Epoch 26: 100%|██████████| 1/1 [00:00<00:00, 77.89it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=1.190]
Epoch 26: 100%|██████████| 1/1 [00:00<00:00, 65.83it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=0.741]
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=0.741]        
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.941, train_loss_epoch=0.941]        
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.800, train_loss_epoch=2.800]  

[2m[36m(train_tune pid=701377)[0m Global seed set to 15


Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.666, train_loss_epoch=0.666]         
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.080]        
Epoch 16:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.450, train_loss_epoch=1.450]        
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.852, train_loss_epoch=0.852]        
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.866, train_loss_epoch=0.866]        
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=22.50, train_loss_epoch=22.50]        
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.660, train_loss_epoch=1.660]        
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.610, train_loss_epoch=2.610]        
Epoch 44: 100%|██████████| 1/1 [00:00<00:00, 67.07it/s, v_num=0, train_loss_step=1.430, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 10


Epoch 6:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=1.030]        
Epoch 12:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.070, train_loss_epoch=2.070]        
Epoch 18:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.791, train_loss_epoch=0.791]         
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.700, train_loss_epoch=1.700]        
Epoch 29:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.596, train_loss_epoch=0.596]        
Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.240, train_loss_epoch=1.240]        
Epoch 40: 100%|██████████| 1/1 [00:00<00:00, 49.68it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.210]
Epoch 46:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.260, train_loss_epoch=1.260]        
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=1.120] 

[2m[36m(train_tune pid=701377)[0m Global seed set to 19


Epoch 9:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.630, train_loss_epoch=1.630]         
Epoch 15:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.310, train_loss_epoch=1.310]        
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.230, train_loss_epoch=1.230]         
Epoch 20: 100%|██████████| 1/1 [00:00<00:00, 70.75it/s, v_num=0, train_loss_step=0.808, train_loss_epoch=1.230]
Epoch 25: 100%|██████████| 1/1 [00:00<00:00, 47.57it/s, v_num=0, train_loss_step=0.855, train_loss_epoch=0.881]
Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.855, train_loss_epoch=0.855]        
Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.749, train_loss_epoch=0.749]        
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.523, train_loss_epoch=0.523]         
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.712, train_loss_epoch=0.712

[2m[36m(train_tune pid=701377)[0m Global seed set to 14


Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.130, train_loss_epoch=1.130]         
Epoch 41: 100%|██████████| 1/1 [00:00<00:00, 162.93it/s, v_num=0, train_loss_step=1.620, train_loss_epoch=1.620]
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.620, train_loss_epoch=1.620]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.814, train_loss_epoch=0.814]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.740, train_loss_epoch=1.740]         
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.711, train_loss_epoch=0.711]         
Epoch 81:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=0.741]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.407, train_loss_epoch=0.407]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 165.89it/s, v_num=0, train_loss_step=1.250, train_l

[2m[36m(train_tune pid=701377)[0m Global seed set to 9


Epoch 19: 100%|██████████| 1/1 [00:00<00:00, 101.82it/s, v_num=0, train_loss_step=0.713, train_loss_epoch=0.713]
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.713, train_loss_epoch=0.713]         
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.470, train_loss_epoch=0.470]         
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.615, train_loss_epoch=0.615]         
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.320, train_loss_epoch=1.320]         
Epoch 69: 100%|██████████| 1/1 [00:00<00:00, 154.77it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.120]
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.040]         
Epoch 82:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.332, train_loss_epoch=0.332]         
Epoch 95:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.216, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 7


Epoch 18: 100%|██████████| 1/1 [00:00<00:00, 168.94it/s, v_num=0, train_loss_step=486.0, train_loss_epoch=128.0]
Epoch 19:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=486.0, train_loss_epoch=486.0]         
Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=45.80, train_loss_epoch=45.80]             
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=52.40, train_loss_epoch=52.40]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=35.70, train_loss_epoch=35.70]             
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=204.0, train_loss_epoch=204.0]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 140.65it/s, v_num=0, train_loss_step=16.00, train_loss_epoch=48.70]  
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=16.00, train_loss_epoch=16.00]         
Epoch 80:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.73e+3, trai

[2m[36m(train_tune pid=701377)[0m Global seed set to 17


Epoch 4:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.080]         
Epoch 16: 100%|██████████| 1/1 [00:00<00:00, 106.91it/s, v_num=0, train_loss_step=3.380, train_loss_epoch=3.380]
Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.380, train_loss_epoch=3.380]         
Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.050, train_loss_epoch=1.050]         
Epoch 42: 100%|██████████| 1/1 [00:00<00:00, 182.38it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.120]
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.757, train_loss_epoch=0.757]         
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.461, train_loss_epoch=0.461]         
Epoch 82:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.573, train_loss_epoch=

[2m[36m(train_tune pid=701377)[0m Global seed set to 5


Epoch 13:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=39.40, train_loss_epoch=39.40]         
Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=63.80, train_loss_epoch=63.80]         
Epoch 23: 100%|██████████| 1/1 [00:00<00:00, 180.58it/s, v_num=0, train_loss_step=63.80, train_loss_epoch=63.80]
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=16.70, train_loss_epoch=16.70]         
Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=60.30, train_loss_epoch=60.30]         
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=93.60, train_loss_epoch=93.60]         
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=24.50, train_loss_epoch=24.50]         
Epoch 72: 100%|██████████| 1/1 [00:00<00:00, 157.50it/s, v_num=0, train_loss_step=610.0, train_loss_epoch=360.0]  
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=610.0, train_loss_epo

[2m[36m(train_tune pid=701377)[0m Global seed set to 8


Epoch 3: 100%|██████████| 1/1 [00:00<00:00, 134.21it/s, v_num=0, train_loss_step=0.915, train_loss_epoch=0.915]
Epoch 4:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.915, train_loss_epoch=0.915]         
Epoch 15:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.791, train_loss_epoch=0.791]         
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.700, train_loss_epoch=1.700]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.866, train_loss_epoch=0.866]         
Epoch 50:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.570, train_loss_epoch=1.570]         
Epoch 61: 100%|██████████| 1/1 [00:00<00:00, 87.08it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=0.778] 
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]        
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.497, train_loss_epoch=0.

[2m[36m(train_tune pid=701377)[0m Global seed set to 2


Epoch 16: 100%|██████████| 1/1 [00:00<00:00, 88.85it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.440] 
Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.040]        
Epoch 29:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.280, train_loss_epoch=1.280]         
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.726, train_loss_epoch=0.726]         
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.867, train_loss_epoch=0.867]         
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.704, train_loss_epoch=0.704]         
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.884, train_loss_epoch=0.884]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.519, train_loss_epoch=0.519]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 90.01it/s, v_num=0, train_loss_step=0.714, train_los

[2m[36m(train_tune pid=701377)[0m Global seed set to 16


Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.170, train_loss_epoch=1.170]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.698, train_loss_epoch=0.698]         
Epoch 71: 100%|██████████| 1/1 [00:00<00:00, 195.29it/s, v_num=0, train_loss_step=5.740, train_loss_epoch=0.698]
Epoch 72:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.740, train_loss_epoch=5.740]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.656, train_loss_epoch=0.656]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 195.52it/s, v_num=0, train_loss_step=0.735, train_loss_epoch=0.670]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 87.09it

[2m[36m(train_tune pid=701377)[0m Global seed set to 1


Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.580, train_loss_epoch=2.580]         
Epoch 46:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=9.190, train_loss_epoch=9.190]         
Epoch 63:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.100, train_loss_epoch=5.100]         
Epoch 80: 100%|██████████| 1/1 [00:00<00:00, 199.94it/s, v_num=0, train_loss_step=187.0, train_loss_epoch=1.960]
Epoch 81:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=187.0, train_loss_epoch=187.0]         
Epoch 98:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=6.080, train_loss_epoch=6.080]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 199.03it/s, v_num=0, train_loss_step=6.010, train_loss_epoch=7.670]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 87.27it

[2m[36m(train_tune pid=701377)[0m Global seed set to 2


Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.180, train_loss_epoch=5.180]         
Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=30.80, train_loss_epoch=30.80]         
Epoch 51:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=11.90, train_loss_epoch=11.90]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 177.91it/s, v_num=0, train_loss_step=4.860, train_loss_epoch=4.860]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.860, train_loss_epoch=4.860]         
Epoch 85:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.710, train_loss_epoch=5.710]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 190.92it/s, v_num=0, train_loss_step=8.590, train_loss_epoch=8.480]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 68.38it

[2m[36m(train_tune pid=701377)[0m Global seed set to 8


Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.280, train_loss_epoch=1.280]         
Epoch 47:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.430, train_loss_epoch=1.430]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.544, train_loss_epoch=0.544]         
Epoch 63:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.519, train_loss_epoch=0.519]         
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.664, train_loss_epoch=0.664]         
Epoch 78: 100%|██████████| 1/1 [00:00<00:00, 164.19it/s, v_num=0, train_loss_step=1.220, train_loss_epoch=1.220]
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.220, train_loss_epoch=1.220]         
Epoch 94: 100%|██████████| 1/1 [00:00<00:00, 178.67it/s, v_num=0, train_loss_step=0.585, train_loss_epoch=0.918]
Epoch 95:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.585, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 17


Epoch 18:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.010, train_loss_epoch=1.010]         
Epoch 35: 100%|██████████| 1/1 [00:00<00:00, 189.86it/s, v_num=0, train_loss_step=1.370, train_loss_epoch=1.370]
Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.370, train_loss_epoch=1.370]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.930, train_loss_epoch=1.930]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.624, train_loss_epoch=0.624]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.170, train_loss_epoch=2.170]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 201.76it/s, v_num=0, train_loss_step=1.590, train_loss_epoch=1.340]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 89.70it

[2m[36m(train_tune pid=701377)[0m Global seed set to 8


Epoch 15:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.510, train_loss_epoch=3.510]         
Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=20.30, train_loss_epoch=20.30]         
Epoch 31: 100%|██████████| 1/1 [00:00<00:00, 175.74it/s, v_num=0, train_loss_step=17.50, train_loss_epoch=17.50]
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=17.50, train_loss_epoch=17.50]         
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=16.00, train_loss_epoch=16.00]         
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.850, train_loss_epoch=4.850]         
Epoch 83:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.100, train_loss_epoch=4.100]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 194.60it/s, v_num=0, train_loss_step=41.50, train_loss_epoch=11.20]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=701377)[0m Global seed set to 12


Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.710, train_loss_epoch=0.710]         
Epoch 32: 100%|██████████| 1/1 [00:00<00:00, 200.78it/s, v_num=0, train_loss_step=7.510, train_loss_epoch=0.710]
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=7.510, train_loss_epoch=7.510]         
Epoch 50:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.778, train_loss_epoch=0.778]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 189.38it/s, v_num=0, train_loss_step=0.928, train_loss_epoch=0.928]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.928, train_loss_epoch=0.928]         
Epoch 85:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.646, train_loss_epoch=0.646]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 192.26it/s, v_num=0, train_loss_step=0.552, train_loss_epoch=0.969]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=701377)[0m Global seed set to 1


Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.464, train_loss_epoch=0.464]         
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.500]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.860, train_loss_epoch=1.860]         
Epoch 56: 100%|██████████| 1/1 [00:00<00:00, 180.07it/s, v_num=0, train_loss_step=3.210, train_loss_epoch=3.210]
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.210, train_loss_epoch=3.210]         
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.573, train_loss_epoch=0.573]         
Epoch 73: 100%|██████████| 1/1 [00:00<00:00, 177.91it/s, v_num=0, train_loss_step=0.716, train_loss_epoch=0.716]
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.716, train_loss_epoch=0.716]         
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.542, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 6


Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.920, train_loss_epoch=2.920]         
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.280, train_loss_epoch=5.280]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=31.20, train_loss_epoch=31.20]         
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=34.00, train_loss_epoch=34.00]         
Epoch 96:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.130, train_loss_epoch=8.130]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 190.76it/s, v_num=0, train_loss_step=952.0, train_loss_epoch=121.0]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 85.69it/s, v_num=0, train_loss_step=952.0, train_loss_epoch=121.0, valid_loss=18.40]
Epoch 111:   0%|          | 0/1 [00

[2m[36m(train_tune pid=701377)[0m Global seed set to 12


Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.705, train_loss_epoch=0.705]         
Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.200, train_loss_epoch=1.200]         
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.060, train_loss_epoch=1.060]         
Epoch 65:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.554, train_loss_epoch=0.554]         
Epoch 65: 100%|██████████| 1/1 [00:00<00:00, 193.95it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=0.554]
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=1.190]         
Epoch 83:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.678, train_loss_epoch=0.678]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 190.89it/s, v_num=0, train_loss_step=0.701, train_loss_epoch=0.944]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=701377)[0m Global seed set to 8


Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.647, train_loss_epoch=0.647]         
Epoch 37: 100%|██████████| 1/1 [00:00<00:00, 181.78it/s, v_num=0, train_loss_step=0.666, train_loss_epoch=0.666]
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.666, train_loss_epoch=0.666]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.993, train_loss_epoch=0.993]         
Epoch 72:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.318, train_loss_epoch=0.318]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.842, train_loss_epoch=0.842]         
Epoch 89: 100%|██████████| 1/1 [00:00<00:00, 184.32it/s, v_num=0, train_loss_step=0.990, train_loss_epoch=0.990]
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.990, train_loss_epoch=0.990]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 195.17it/s, v_num=0, train_loss_step=0.630, train_l

[2m[36m(train_tune pid=701377)[0m Global seed set to 11


Epoch 13:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.090, train_loss_epoch=1.090]         
Epoch 13: 100%|██████████| 1/1 [00:00<00:00, 191.64it/s, v_num=0, train_loss_step=1.440, train_loss_epoch=1.090]
Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.440, train_loss_epoch=1.440]         
Epoch 30: 100%|██████████| 1/1 [00:00<00:00, 180.98it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.500]
Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.500]         
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]         
Epoch 64: 100%|██████████| 1/1 [00:00<00:00, 177.72it/s, v_num=0, train_loss_step=0.726, train_loss_epoch=0.726]
Epoch 65:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.726, train_loss_epoch=0.726]         
Epoch 81:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.977, train_loss_epoch

[2m[36m(train_tune pid=701377)[0m Global seed set to 1


Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.030, train_loss_epoch=4.030]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.410, train_loss_epoch=2.410]         
Epoch 54: 100%|██████████| 1/1 [00:00<00:00, 201.27it/s, v_num=0, train_loss_step=1.990, train_loss_epoch=2.410]
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.990, train_loss_epoch=1.990]         
Epoch 72:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.804, train_loss_epoch=0.804]         
Epoch 72: 100%|██████████| 1/1 [00:00<00:00, 202.71it/s, v_num=0, train_loss_step=0.895, train_loss_epoch=0.804]
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.895, train_loss_epoch=0.895]         
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.410, train_loss_epoch=5.410]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 201.12it/s, v_num=0, train_loss_step=137.0, train_l

Global seed set to 17


Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 193.98it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=0.647, valid_loss=0.561]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 86.83it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=0.647, valid_loss=0.893] 
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 66.91it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=1.030, valid_loss=0.893]


Sanity Checking: 0it [00:00, ?it/s]

Training: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

IOPub message rate exceeded.
The Jupyter server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--ServerApp.iopub_msg_rate_limit`.

Current values:
ServerApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
ServerApp.rate_limit_window=3.0 (secs)

[2m[36m(pid=709027)[0m   warn(f"Failed to load image Python extension: {e}")
[2m[36m(train_tune pid=709027)[0m Global seed set to 8
[2m[36m(train_tune pid=709027)[0m --------------------------------------------------------------------------
[2m[36m(train_tune pid=709027)[0m detected:
[2m[36m(train_tune pid=709027)[0m 
[2m[36m(train_tune pid=709027)[0m   Local host:            152-67-225-75
[2m[36m(train_tune pid=709027)[0m   Device name:           mlx5_0
[2m[36m(train_tune pid=709027)[0m   Device vendor ID:      0x02c9
[2m[36m(train_tune pid=709027)[0m   Device vendor part ID: 4126
[2m[36m(train_tune pid=709027)[0m 
[2m[36m(train_tune pid=709

Epoch 0:   0%|          | 0/1 [00:00<?, ?it/s]                             
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.765, train_loss_epoch=0.765]         
Epoch 11: 100%|██████████| 1/1 [00:00<00:00, 170.96it/s, v_num=0, train_loss_step=2.790, train_loss_epoch=2.790]
Epoch 12:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.790, train_loss_epoch=2.790]         
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=0.741]         
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]         
Epoch 59: 100%|██████████| 1/1 [00:00<00:00, 169.18it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]         
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.540, train_loss_epoch=8.540]         
Epoch 91: 100%|█████

[2m[36m(train_tune pid=709027)[0m Global seed set to 2


Epoch 2:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.930, train_loss_epoch=1.930]         
Epoch 2: 100%|██████████| 1/1 [00:00<00:00, 174.77it/s, v_num=0, train_loss_step=2.240, train_loss_epoch=2.240]
Epoch 3:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.240, train_loss_epoch=2.240]         
Epoch 19:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.130, train_loss_epoch=1.130]         
Epoch 19: 100%|██████████| 1/1 [00:00<00:00, 177.36it/s, v_num=0, train_loss_step=2.310, train_loss_epoch=2.310]
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.310, train_loss_epoch=2.310]         
Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=1.190]         
Epoch 36: 100%|██████████| 1/1 [00:00<00:00, 178.66it/s, v_num=0, train_loss_step=1.960, train_loss_epoch=1.960]
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.960, train_loss_epoch=1.

[2m[36m(train_tune pid=709027)[0m Global seed set to 18


Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.360, train_loss_epoch=1.360]         
Epoch 46: 100%|██████████| 1/1 [00:00<00:00, 179.55it/s, v_num=0, train_loss_step=1.570, train_loss_epoch=1.570]
Epoch 47:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.570, train_loss_epoch=1.570]         
Epoch 63: 100%|██████████| 1/1 [00:00<00:00, 177.63it/s, v_num=0, train_loss_step=1.280, train_loss_epoch=1.280]
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.280, train_loss_epoch=1.280]         
Epoch 80: 100%|██████████| 1/1 [00:00<00:00, 180.99it/s, v_num=0, train_loss_step=1.810, train_loss_epoch=1.810]
Epoch 81:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.810, train_loss_epoch=1.810]         
Epoch 97: 100%|██████████| 1/1 [00:00<00:00, 180.27it/s, v_num=0, train_loss_step=0.595, train_loss_epoch=0.595]
Epoch 98:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.595, train_loss_epoch

[2m[36m(train_tune pid=709027)[0m Global seed set to 15


Epoch 16:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.700, train_loss_epoch=1.700]         
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.470, train_loss_epoch=1.470]         
Epoch 32: 100%|██████████| 1/1 [00:00<00:00, 175.75it/s, v_num=0, train_loss_step=1.660, train_loss_epoch=1.660]
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.660, train_loss_epoch=1.660]         
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.660, train_loss_epoch=1.660]
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.801, train_loss_epoch=0.801]         
Epoch 65:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.993, train_loss_epoch=0.993]         
Epoch 82:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=1.030]         
Epoch 98:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.790, train_loss_epoch=0.790]  

[2m[36m(train_tune pid=709027)[0m Global seed set to 5


Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=12.40, train_loss_epoch=12.40]         
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.170, train_loss_epoch=8.170]         
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=30.30, train_loss_epoch=30.30]             
Epoch 82:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.040, train_loss_epoch=5.040]         
Epoch 83:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.040, train_loss_epoch=5.040]
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 193.03it/s, v_num=0, train_loss_step=1.760, train_loss_epoch=2.420]    
[2m[36m(train_tune pid=709027)[0m 
Validation: 0it [00:00, ?it/s][A[0m 
[2m[36m(train_tune pid=709027)[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
[2m[36m(train_tune pid=709027)[0m 
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 87.77it

[2m[36m(train_tune pid=709027)[0m Global seed set to 19


Epoch 19: 100%|██████████| 1/1 [00:00<00:00, 197.12it/s, v_num=0, train_loss_step=0.545, train_loss_epoch=0.545]
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.830, train_loss_epoch=0.830]         
Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.684, train_loss_epoch=0.684]         
Epoch 36: 100%|██████████| 1/1 [00:00<00:00, 182.69it/s, v_num=0, train_loss_step=0.590, train_loss_epoch=0.684]
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.590, train_loss_epoch=0.590]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.400, train_loss_epoch=1.400]         
Epoch 53: 100%|██████████| 1/1 [00:00<00:00, 176.75it/s, v_num=0, train_loss_step=0.972, train_loss_epoch=0.972]
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.972, train_loss_epoch=0.972]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.643, train_loss_epoch

[2m[36m(train_tune pid=709027)[0m Global seed set to 8


Epoch 16: 100%|██████████| 1/1 [00:00<00:00, 181.39it/s, v_num=0, train_loss_step=1.160, train_loss_epoch=1.160]
Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.160, train_loss_epoch=1.160]         
Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.774, train_loss_epoch=0.774]         
Epoch 50:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.593, train_loss_epoch=0.593]         
Epoch 51:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.568, train_loss_epoch=0.568]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 179.68it/s, v_num=0, train_loss_step=0.808, train_loss_epoch=0.808]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.808, train_loss_epoch=0.808]         
Epoch 85:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.252, train_loss_epoch=0.252]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 192.87it/s, v_num=0, train_loss_step=0.764, train_l

[2m[36m(train_tune pid=709027)[0m Global seed set to 14


Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.170, train_loss_epoch=1.170]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.300, train_loss_epoch=1.300]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.598, train_loss_epoch=0.598]         
Epoch 70: 100%|██████████| 1/1 [00:00<00:00, 190.32it/s, v_num=0, train_loss_step=0.977, train_loss_epoch=1.900]
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.977, train_loss_epoch=0.977]         
Epoch 87: 100%|██████████| 1/1 [00:00<00:00, 191.80it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=0.729]
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=1.120]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 189.77it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=0.772]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=709027)[0m Global seed set to 3


Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.370, train_loss_epoch=1.370]         
Epoch 46: 100%|██████████| 1/1 [00:00<00:00, 174.38it/s, v_num=0, train_loss_step=1.960, train_loss_epoch=0.447]
Epoch 47:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.960, train_loss_epoch=1.960]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.906, train_loss_epoch=0.906]           
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.976, train_loss_epoch=0.976]         
Epoch 63:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.976, train_loss_epoch=0.976]
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.760, train_loss_epoch=1.760]         
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.190, train_loss_epoch=4.190]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.530, train_loss_epoch=2.530]

[2m[36m(train_tune pid=709027)[0m Global seed set to 5


Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.060, train_loss_epoch=2.060]         
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=7.540, train_loss_epoch=7.540]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=39.40, train_loss_epoch=39.40]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=23.70, train_loss_epoch=23.70]         
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=6.66e+3, train_loss_epoch=6.66e+3]         
Epoch 85:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=13.50, train_loss_epoch=13.50]             
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 181.59it/s, v_num=0, train_loss_step=0.985, train_loss_epoch=1.140]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0: 100%|██████████| 1/1

[2m[36m(train_tune pid=709027)[0m Global seed set to 7


Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.400, train_loss_epoch=2.400]         
Epoch 42: 100%|██████████| 1/1 [00:00<00:00, 183.98it/s, v_num=0, train_loss_step=0.963, train_loss_epoch=1.130]
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.963, train_loss_epoch=0.963]         
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.890, train_loss_epoch=1.890]         
Epoch 75:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.330, train_loss_epoch=1.330]         
Epoch 75: 100%|██████████| 1/1 [00:00<00:00, 175.00it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.080]
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.080]         
Epoch 92:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.927, train_loss_epoch=0.927]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 184.69it/s, v_num=0, train_loss_step=0.719, train_l

[2m[36m(train_tune pid=709027)[0m Global seed set to 3


Epoch 16:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.295, train_loss_epoch=0.295]         
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.500]         
Epoch 49: 100%|██████████| 1/1 [00:00<00:00, 187.13it/s, v_num=0, train_loss_step=1.220, train_loss_epoch=0.613]
Epoch 50:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.220, train_loss_epoch=1.220]         
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.547, train_loss_epoch=0.547]         
Epoch 83:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.919, train_loss_epoch=0.919]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 188.85it/s, v_num=0, train_loss_step=0.541, train_loss_epoch=0.393]
[2m[36m(train_tune pid=709027)[0m 
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%

[2m[36m(train_tune pid=709027)[0m Global seed set to 19


Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.330, train_loss_epoch=1.330]         
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.350, train_loss_epoch=1.350]         
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.490, train_loss_epoch=1.490]         
Epoch 57: 100%|██████████| 1/1 [00:00<00:00, 165.84it/s, v_num=0, train_loss_step=0.658, train_loss_epoch=0.658]
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.658, train_loss_epoch=0.658]         
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]         
Epoch 73: 100%|██████████| 1/1 [00:00<00:00, 181.70it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.939, train_loss_epoch=0.939]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.460, train_loss_epoch

[2m[36m(train_tune pid=709027)[0m Global seed set to 8


Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]         
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.400, train_loss_epoch=3.400]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.987, train_loss_epoch=0.987]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.987, train_loss_epoch=0.987]
Epoch 65:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.940, train_loss_epoch=1.940]         
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.770, train_loss_epoch=8.770]         
Epoch 91:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.457, train_loss_epoch=0.457]         
Epoch 92:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.457, train_loss_epoch=0.457]
E

[2m[36m(train_tune pid=709027)[0m Global seed set to 8


Epoch 3:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.656, train_loss_epoch=0.656]         
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.692, train_loss_epoch=0.692]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.448, train_loss_epoch=0.448]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.598, train_loss_epoch=0.598]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.777, train_loss_epoch=0.777]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.426, train_loss_epoch=0.426]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 191.75it/s, v_num=0, train_loss_step=0.566, train_loss_epoch=0.182]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 74.26it/

[2m[36m(train_tune pid=709027)[0m Global seed set to 19


Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.080, train_loss_epoch=1.080]         
Epoch 52: 100%|██████████| 1/1 [00:00<00:00, 199.86it/s, v_num=0, train_loss_step=0.955, train_loss_epoch=0.531]
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.955, train_loss_epoch=0.955]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=16.00, train_loss_epoch=16.00]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.901, train_loss_epoch=0.901]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 198.66it/s, v_num=0, train_loss_step=0.381, train_loss_epoch=0.454]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 86.53it/s, v_num=0, train_loss_step=0.381, train_loss_epoch=0.454, valid_loss=0.182]
Epoch 103:   0%|          | 0/1 [00

[2m[36m(train_tune pid=709027)[0m Global seed set to 15


Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=92.90, train_loss_epoch=92.90]         
Epoch 21: 100%|██████████| 1/1 [00:00<00:00, 173.98it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=92.90]
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.500]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.710, train_loss_epoch=1.710]         
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=103.0, train_loss_epoch=103.0]             
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=103.0, train_loss_epoch=103.0]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.650, train_loss_epoch=3.650]         
Epoch 68: 100%|██████████| 1/1 [00:00<00:00, 175.30it/s, v_num=0, train_loss_step=2.920, train_loss_epoch=3.650]
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.920, train_loss_epoch=2.92

[2m[36m(train_tune pid=709027)[0m Global seed set to 18


Epoch 10: 100%|██████████| 1/1 [00:00<00:00, 168.46it/s, v_num=0, train_loss_step=1.050, train_loss_epoch=1.050]
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.050, train_loss_epoch=1.050]         
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.000, train_loss_epoch=4.000]         
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.710, train_loss_epoch=3.710]         
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=38.90, train_loss_epoch=38.90]         
Epoch 74: 100%|██████████| 1/1 [00:00<00:00, 168.43it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]
Epoch 75:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]         
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.880, train_loss_epoch=3.880]         
Epoch 90: 100%|██████████| 1/1 [00:00<00:00, 178.61it/s, v_num=0, train_loss_step=2.160, train_l

[2m[36m(train_tune pid=709027)[0m Global seed set to 11


Epoch 4: 100%|██████████| 1/1 [00:00<00:00, 171.32it/s, v_num=0, train_loss_step=2.590, train_loss_epoch=2.590]
Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.590, train_loss_epoch=2.590]         
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.381, train_loss_epoch=0.381]         
Epoch 21: 100%|██████████| 1/1 [00:00<00:00, 182.96it/s, v_num=0, train_loss_step=0.954, train_loss_epoch=0.381]
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.954, train_loss_epoch=0.954]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.840, train_loss_epoch=1.840]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.602, train_loss_epoch=0.602]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.595, train_loss_epoch=0.595]         
Epoch 71: 100%|██████████| 1/1 [00:00<00:00, 182.49it/s, v_num=0, train_loss_step=0.791, train_los

[2m[36m(train_tune pid=709027)[0m Global seed set to 11


Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=7.420, train_loss_epoch=7.420]         
Epoch 11: 100%|██████████| 1/1 [00:00<00:00, 177.69it/s, v_num=0, train_loss_step=12.60, train_loss_epoch=12.60]
Epoch 12:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=12.60, train_loss_epoch=12.60]         
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.270, train_loss_epoch=2.270]         
Epoch 28: 100%|██████████| 1/1 [00:00<00:00, 183.87it/s, v_num=0, train_loss_step=3.390, train_loss_epoch=2.270]
Epoch 29:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.390, train_loss_epoch=3.390]         
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.020, train_loss_epoch=5.020]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=6.240, train_loss_epoch=6.240]         
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=10.10, train_loss_epoch

[2m[36m(train_tune pid=709027)[0m Global seed set to 13


Epoch 9:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.907, train_loss_epoch=0.907]         
Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]         
Epoch 43: 100%|██████████| 1/1 [00:00<00:00, 187.56it/s, v_num=0, train_loss_step=1.000, train_loss_epoch=1.000]
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.000, train_loss_epoch=1.000]         
Epoch 61:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.631, train_loss_epoch=0.631]         
Epoch 78: 100%|██████████| 1/1 [00:00<00:00, 185.08it/s, v_num=0, train_loss_step=1.350, train_loss_epoch=1.350]
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.350, train_loss_epoch=1.350]         
Epoch 96:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.300, train_loss_epoch=1.300]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 198.25it/s, v_num=0, train_loss_step=4.750, train_lo

[2m[36m(train_tune pid=709027)[0m Global seed set to 10


Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.480, train_loss_epoch=1.480]         
Epoch 36: 100%|██████████| 1/1 [00:00<00:00, 176.51it/s, v_num=0, train_loss_step=0.622, train_loss_epoch=1.090]
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.622, train_loss_epoch=0.622]         
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.784, train_loss_epoch=0.784]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.761, train_loss_epoch=0.761]         
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.474, train_loss_epoch=0.474]         
Epoch 68: 100%|██████████| 1/1 [00:00<00:00, 174.89it/s, v_num=0, train_loss_step=0.813, train_loss_epoch=0.474]
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.813, train_loss_epoch=0.813]         
Epoch 84:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.594, train_loss_epoch

[2m[36m(train_tune pid=709027)[0m Global seed set to 11


Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.670, train_loss_epoch=1.670]         
Epoch 46:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.850, train_loss_epoch=3.850]         
Epoch 46: 100%|██████████| 1/1 [00:00<00:00, 171.53it/s, v_num=0, train_loss_step=1.370, train_loss_epoch=1.370]
Epoch 47:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.370, train_loss_epoch=1.370]         
Epoch 63:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.050, train_loss_epoch=1.050]             
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.660, train_loss_epoch=1.660]         
Epoch 95: 100%|██████████| 1/1 [00:00<00:00, 189.25it/s, v_num=0, train_loss_step=1.460, train_loss_epoch=1.460]
Epoch 96:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=13.20, train_loss_epoch=13.20]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 184.92it/s, v_num=0, train_loss_step=6.780, tra

[2m[36m(train_tune pid=709027)[0m Global seed set to 8


Epoch 10:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.914, train_loss_epoch=0.914]        
Epoch 10: 100%|██████████| 1/1 [00:00<00:00, 171.17it/s, v_num=0, train_loss_step=1.540, train_loss_epoch=0.914]
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.540, train_loss_epoch=1.540]         
Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.000, train_loss_epoch=1.000]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.405, train_loss_epoch=0.405]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.856, train_loss_epoch=0.856]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.230, train_loss_epoch=1.230]         
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.491, train_loss_epoch=0.491]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 165.25it/s, v_num=0, train_loss_step=0.873, train_lo

[2m[36m(train_tune pid=709027)[0m Global seed set to 17


Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.000, train_loss_epoch=1.000]         
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.380, train_loss_epoch=4.380]         
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.380, train_loss_epoch=1.380]         
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.090, train_loss_epoch=1.090]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 194.14it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.390]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 88.24it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.390, valid_loss=0.199]
Epoch 101:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.931, train_loss_epoch=0.931, valid_loss=0.199]         
Epoch 118:   0%|

[2m[36m(train_tune pid=709027)[0m Global seed set to 11


Epoch 19:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=10.40, train_loss_epoch=10.40]         
Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=9.210, train_loss_epoch=9.210]         
Epoch 50:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.490, train_loss_epoch=3.490]         
Epoch 50: 100%|██████████| 1/1 [00:00<00:00, 168.25it/s, v_num=0, train_loss_step=2.01e+4, train_loss_epoch=2.01e+4]
Epoch 51:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.01e+4, train_loss_epoch=2.01e+4]         
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.220, train_loss_epoch=8.220]             
Epoch 66:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=14.60, train_loss_epoch=14.60]         
Epoch 67:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=14.60, train_loss_epoch=14.60]
Epoch 82: 100%|██████████| 1/1 [00:00<00:00, 183.02it/s, v_num=0, train_loss_step=1.820, trai

[2m[36m(train_tune pid=709027)[0m Global seed set to 15


Epoch 5: 100%|██████████| 1/1 [00:00<00:00, 172.88it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]
Epoch 6:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]         
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.576, train_loss_epoch=0.576]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.110, train_loss_epoch=2.110]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.390, train_loss_epoch=1.390]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.640, train_loss_epoch=0.640]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.858, train_loss_epoch=0.858]         
Epoch 87:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.708, train_loss_epoch=0.708]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 182.19it/s, v_num=0, train_loss_step=1.060, train_los

[2m[36m(train_tune pid=709027)[0m Global seed set to 16


Epoch 7:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.240, train_loss_epoch=1.240]         
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.885, train_loss_epoch=0.885]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.928, train_loss_epoch=0.928]         
Epoch 57: 100%|██████████| 1/1 [00:00<00:00, 180.70it/s, v_num=0, train_loss_step=0.780, train_loss_epoch=0.780]
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.780, train_loss_epoch=0.780]         
Epoch 75:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.640, train_loss_epoch=1.640]         
Epoch 91: 100%|██████████| 1/1 [00:00<00:00, 183.62it/s, v_num=0, train_loss_step=1.300, train_loss_epoch=1.300]
Epoch 92:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.300, train_loss_epoch=1.300]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 191.08it/s, v_num=0, train_loss_step=0.753, train_lo

[2m[36m(train_tune pid=709027)[0m Global seed set to 10


Epoch 31:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.180, train_loss_epoch=1.180]         
Epoch 47: 100%|██████████| 1/1 [00:00<00:00, 198.67it/s, v_num=0, train_loss_step=0.941, train_loss_epoch=0.941]
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.909, train_loss_epoch=0.909]         
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.437, train_loss_epoch=0.437]         
Epoch 64: 100%|██████████| 1/1 [00:00<00:00, 178.07it/s, v_num=0, train_loss_step=0.628, train_loss_epoch=0.628]
Epoch 65:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.628, train_loss_epoch=0.628]         
Epoch 81: 100%|██████████| 1/1 [00:00<00:00, 179.57it/s, v_num=0, train_loss_step=0.849, train_loss_epoch=0.849]
Epoch 82:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.849, train_loss_epoch=0.849]         
Epoch 98: 100%|██████████| 1/1 [00:00<00:00, 178.85it/s, v_num=0, train_loss_step=0.608, train_l

[2m[36m(train_tune pid=709027)[0m Global seed set to 16


Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.000, train_loss_epoch=1.000]         
Epoch 27: 100%|██████████| 1/1 [00:00<00:00, 183.77it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=2.610]
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=4.720]         
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=30.70, train_loss_epoch=30.70]         
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.91e+3, train_loss_epoch=2.91e+3]         
Epoch 60: 100%|██████████| 1/1 [00:00<00:00, 191.13it/s, v_num=0, train_loss_step=2.91e+3, train_loss_epoch=2.91e+3]
Epoch 61:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=9.750, train_loss_epoch=9.750]             
Epoch 77:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.690, train_loss_epoch=4.690]             
Epoch 93:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.320, 

Global seed set to 5


Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 182.96it/s, v_num=0, train_loss_step=2.540, train_loss_epoch=2.910, valid_loss=0.178]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 68.90it/s, v_num=0, train_loss_step=2.540, train_loss_epoch=2.910, valid_loss=0.171] 
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 52.55it/s, v_num=0, train_loss_step=2.540, train_loss_epoch=2.540, valid_loss=0.171]


Sanity Checking: 0it [00:00, ?it/s]

Training: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

IOPub message rate exceeded.
The Jupyter server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--ServerApp.iopub_msg_rate_limit`.

Current values:
ServerApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
ServerApp.rate_limit_window=3.0 (secs)

[2m[36m(pid=713766)[0m   warn(f"Failed to load image Python extension: {e}")
[2m[36m(train_tune pid=713766)[0m Global seed set to 15
[2m[36m(train_tune pid=713766)[0m --------------------------------------------------------------------------
[2m[36m(train_tune pid=713766)[0m detected:
[2m[36m(train_tune pid=713766)[0m 
[2m[36m(train_tune pid=713766)[0m   Local host:            152-67-225-75
[2m[36m(train_tune pid=713766)[0m   Device name:           mlx5_0
[2m[36m(train_tune pid=713766)[0m   Device vendor ID:      0x02c9
[2m[36m(train_tune pid=713766)[0m   Device vendor part ID: 4126
[2m[36m(train_tune pid=713766)[0m 
[2m[36m(train_tune pid=71

Sanity Checking DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s]
Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.874, train_loss_epoch=0.874]         
Epoch 6:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.100, train_loss_epoch=1.100]         
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.323, train_loss_epoch=0.323]         
Epoch 38: 100%|██████████| 1/1 [00:00<00:00, 194.27it/s, v_num=0, train_loss_step=1.590, train_loss_epoch=1.590]
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.780, train_loss_epoch=2.780]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.955, train_loss_epoch=0.955]         
Epoch 71: 100%|██████████| 1/1 [00:00<00:00, 193.81it/s, v_num=0, train_loss_step=0.836, train_loss_epoch=0.836]
Epoch 72:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.621, train_loss_epoch=0.621]         
Epoch 88:   0%|          | 0/1

[2m[36m(train_tune pid=713766)[0m Global seed set to 7


Epoch 12:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.820, train_loss_epoch=2.820]         
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.850, train_loss_epoch=1.850]         
Epoch 28: 100%|██████████| 1/1 [00:00<00:00, 174.10it/s, v_num=0, train_loss_step=41.80, train_loss_epoch=41.80]
Epoch 29:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=41.80, train_loss_epoch=41.80]         
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.530, train_loss_epoch=2.530]         
Epoch 61:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.960, train_loss_epoch=1.960]         
Epoch 77:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.580, train_loss_epoch=1.580]         
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.870, train_loss_epoch=1.870]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.170, train_loss_epoch

[2m[36m(train_tune pid=713766)[0m Global seed set to 15


Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.020, train_loss_epoch=2.020]         
Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.140, train_loss_epoch=1.140]         
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.140, train_loss_epoch=1.140]
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.550, train_loss_epoch=1.550]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.550, train_loss_epoch=2.550]             
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.350, train_loss_epoch=4.350]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=7.690, train_loss_epoch=7.690]         
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.540, train_loss_epoch=1.540]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 173.53it/s, v_num=0, train_loss_step=86.90, train_loss_e

[2m[36m(train_tune pid=713766)[0m Global seed set to 6


Epoch 19:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.783, train_loss_epoch=0.783]         
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.622, train_loss_epoch=0.622]         
Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.040, train_loss_epoch=3.040]         
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.323, train_loss_epoch=0.323]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.325, train_loss_epoch=0.325]         
Epoch 77:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.531, train_loss_epoch=0.531]         
Epoch 91:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.496, train_loss_epoch=0.496]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 159.94it/s, v_num=0, train_loss_step=0.632, train_loss_epoch=0.385]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 7


Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.386, train_loss_epoch=0.386]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.758, train_loss_epoch=0.758]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.610, train_loss_epoch=0.610]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.603, train_loss_epoch=0.603]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.140, train_loss_epoch=1.140]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 192.55it/s, v_num=0, train_loss_step=0.985, train_loss_epoch=0.837]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 86.62it/s, v_num=0, train_loss_step=0.985, train_loss_epoch=0.837, valid_loss=0.265]
Epoch 103:   0%|          | 0/1 [00

[2m[36m(train_tune pid=713766)[0m Global seed set to 5


Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.080, train_loss_epoch=2.080]         
Epoch 18:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.080, train_loss_epoch=2.080]
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.300, train_loss_epoch=1.300]         
Epoch 48: 100%|██████████| 1/1 [00:00<00:00, 163.54it/s, v_num=0, train_loss_step=0.855, train_loss_epoch=0.855]
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.855, train_loss_epoch=0.855]         
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=15.10, train_loss_epoch=15.10]         
Epoch 79: 100%|██████████| 1/1 [00:00<00:00, 164.09it/s, v_num=0, train_loss_step=0.546, train_loss_epoch=0.546]
Epoch 80:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.546, train_loss_epoch=0.546]         
Epoch 95:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.428, train_loss_epoch=0.428]  

[2m[36m(train_tune pid=713766)[0m Global seed set to 4


Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.670, train_loss_epoch=1.670]         
Epoch 36: 100%|██████████| 1/1 [00:00<00:00, 188.59it/s, v_num=0, train_loss_step=0.954, train_loss_epoch=1.670]
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.954, train_loss_epoch=0.954]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.310, train_loss_epoch=1.310]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=52.10, train_loss_epoch=52.10]         
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.120, train_loss_epoch=2.120]         
Epoch 87:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.710, train_loss_epoch=3.710]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 189.64it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=1.630]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 14


Epoch 9: 100%|██████████| 1/1 [00:00<00:00, 168.26it/s, v_num=0, train_loss_step=1.110, train_loss_epoch=1.110]
Epoch 10:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.110, train_loss_epoch=1.110]        
Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.657, train_loss_epoch=0.657]         
Epoch 42:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.983, train_loss_epoch=0.983]         
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.648, train_loss_epoch=0.648]         
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.452, train_loss_epoch=0.452]         
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.862, train_loss_epoch=0.862]         
Epoch 90: 100%|██████████| 1/1 [00:00<00:00, 186.05it/s, v_num=0, train_loss_step=0.862, train_loss_epoch=0.862]
Epoch 91:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.536, train_loss_epoch=0

[2m[36m(train_tune pid=713766)[0m Global seed set to 15


Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=62.30, train_loss_epoch=62.30]             
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=137.0, train_loss_epoch=137.0]             
Epoch 53: 100%|██████████| 1/1 [00:00<00:00, 196.13it/s, v_num=0, train_loss_step=662.0, train_loss_epoch=137.0]
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=662.0, train_loss_epoch=662.0]         
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=450.0, train_loss_epoch=450.0]             
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=581.0, train_loss_epoch=581.0]             
Epoch 88: 100%|██████████| 1/1 [00:00<00:00, 197.66it/s, v_num=0, train_loss_step=380.0, train_loss_epoch=581.0]
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=380.0, train_loss_epoch=380.0]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 192.63it/s, v_num=0, train_loss_ste

[2m[36m(train_tune pid=713766)[0m Global seed set to 10


Epoch 6: 100%|██████████| 1/1 [00:00<00:00, 177.68it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=1.030]
Epoch 7:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.030, train_loss_epoch=1.030]         
Epoch 23: 100%|██████████| 1/1 [00:00<00:00, 181.15it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]
Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]         
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=1.070]
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.427, train_loss_epoch=0.427]         
Epoch 57: 100%|██████████| 1/1 [00:00<00:00, 190.56it/s, v_num=0, train_loss_step=0.618, train_loss_epoch=0.305]
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.618, train_loss_epoch=0.618]         
Epoch 74: 100%|██████████| 1/1 [00:00<00:00, 175.97it/s, v_num=0, train_loss_step=0.816, train_loss_epoch=0

[2m[36m(train_tune pid=713766)[0m Global seed set to 3


Epoch 18:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.850, train_loss_epoch=4.850]         
Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=1.190]         
Epoch 35:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.530, train_loss_epoch=1.530]         
Epoch 51:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.130, train_loss_epoch=1.130]         
Epoch 67:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.830, train_loss_epoch=1.830]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 174.25it/s, v_num=0, train_loss_step=1.360, train_loss_epoch=1.360]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.360, train_loss_epoch=1.360]         
Epoch 84:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 183.88it/s, v_num=0, train_loss_step=349.0, train_l

[2m[36m(train_tune pid=713766)[0m Global seed set to 11


Epoch 5: 100%|██████████| 1/1 [00:00<00:00, 180.61it/s, v_num=0, train_loss_step=5.150, train_loss_epoch=2.430]
Epoch 6:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.150, train_loss_epoch=5.150]         
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.741, train_loss_epoch=0.741]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.230, train_loss_epoch=1.230]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.496, train_loss_epoch=0.496]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.639, train_loss_epoch=0.639]         
Epoch 85: 100%|██████████| 1/1 [00:00<00:00, 168.42it/s, v_num=0, train_loss_step=0.495, train_loss_epoch=0.495]
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.495, train_loss_epoch=0.495]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 180.46it/s, v_num=0, train_loss_step=0.278, train_los

[2m[36m(train_tune pid=713766)[0m Global seed set to 14


Epoch 4:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.993, train_loss_epoch=0.993]         
Epoch 20: 100%|██████████| 1/1 [00:00<00:00, 193.80it/s, v_num=0, train_loss_step=1.530, train_loss_epoch=1.530]
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.721, train_loss_epoch=0.721]         
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.762, train_loss_epoch=0.762]         
Epoch 54:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.648, train_loss_epoch=0.648]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.251, train_loss_epoch=0.251]         
Epoch 70: 100%|██████████| 1/1 [00:00<00:00, 194.60it/s, v_num=0, train_loss_step=0.251, train_loss_epoch=0.251]
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.495, train_loss_epoch=0.495]         
Epoch 87:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.700, train_loss_epoch=

[2m[36m(train_tune pid=713766)[0m Global seed set to 13


Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=4.720]         
Epoch 51:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.980, train_loss_epoch=1.980]         
Epoch 51: 100%|██████████| 1/1 [00:00<00:00, 187.50it/s, v_num=0, train_loss_step=6.240, train_loss_epoch=6.240]
Epoch 52:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=6.240, train_loss_epoch=6.240]         
Epoch 67: 100%|██████████| 1/1 [00:00<00:00, 143.34it/s, v_num=0, train_loss_step=3.920, train_loss_epoch=0.856]
Epoch 68:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.920, train_loss_epoch=3.920]         
Epoch 84:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.888, train_loss_epoch=0.888]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 196.76it/s, v_num=0, train_loss_step=370.0, train_loss_epoch=1.440]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 3


Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=146.0, train_loss_epoch=146.0]           
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=135.0, train_loss_epoch=135.0]         
Epoch 21: 100%|██████████| 1/1 [00:00<00:00, 184.32it/s, v_num=0, train_loss_step=92.00, train_loss_epoch=135.0]
Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=92.00, train_loss_epoch=92.00]         
Epoch 38:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=75.80, train_loss_epoch=75.80]             
Epoch 38: 100%|██████████| 1/1 [00:00<00:00, 176.28it/s, v_num=0, train_loss_step=290.0, train_loss_epoch=290.0]
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=290.0, train_loss_epoch=290.0]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=293.0, train_loss_epoch=293.0]         
Epoch 55: 100%|██████████| 1/1 [00:00<00:00, 191.15it/s, v_num=0, train_loss_step=545.0, tr

[2m[36m(train_tune pid=713766)[0m Global seed set to 17


Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=1.120]         
Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.349, train_loss_epoch=0.349]         
Epoch 46:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.240, train_loss_epoch=1.240]         
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.687, train_loss_epoch=0.687]         
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.777, train_loss_epoch=0.777]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.885, train_loss_epoch=0.885]         
Epoch 94: 100%|██████████| 1/1 [00:00<00:00, 175.91it/s, v_num=0, train_loss_step=1.400, train_loss_epoch=0.885]
Epoch 95:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.400, train_loss_epoch=1.400]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 181.72it/s, v_num=0, train_loss_step=0.760, train_l

[2m[36m(train_tune pid=713766)[0m Global seed set to 5


Epoch 4:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.802, train_loss_epoch=0.802]         
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.954, train_loss_epoch=0.954]         
Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.950, train_loss_epoch=0.950]         
Epoch 36: 100%|██████████| 1/1 [00:00<00:00, 185.17it/s, v_num=0, train_loss_step=0.404, train_loss_epoch=0.950]
Epoch 37:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.404, train_loss_epoch=0.404]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]         
Epoch 69:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=14.10, train_loss_epoch=14.10]         
Epoch 85:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.456, train_loss_epoch=0.456]         
Epoch 85: 100%|██████████| 1/1 [00:00<00:00, 183.41it/s, v_num=0, train_loss_step=1.040, train_lo

[2m[36m(train_tune pid=713766)[0m Global seed set to 10


Epoch 10:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=1.120]        
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.904, train_loss_epoch=0.904]         
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.220, train_loss_epoch=1.220]         
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.270, train_loss_epoch=1.270]         
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.669, train_loss_epoch=0.669]         
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.639, train_loss_epoch=0.639]         
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.639, train_loss_epoch=0.639]
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.933, train_loss_epoch=0.933]         
Epoch 92:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.591, train_loss_epoch=0.591]   

[2m[36m(train_tune pid=713766)[0m Global seed set to 9


Epoch 8:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.920, train_loss_epoch=2.920]         
Epoch 23: 100%|██████████| 1/1 [00:00<00:00, 164.74it/s, v_num=0, train_loss_step=3.960, train_loss_epoch=3.960]
Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.960, train_loss_epoch=3.960]         
Epoch 39: 100%|██████████| 1/1 [00:00<00:00, 168.34it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]         
Epoch 55: 100%|██████████| 1/1 [00:00<00:00, 168.35it/s, v_num=0, train_loss_step=3.610, train_loss_epoch=3.610]
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.610, train_loss_epoch=3.610]         
Epoch 71: 100%|██████████| 1/1 [00:00<00:00, 167.74it/s, v_num=0, train_loss_step=1.14e+3, train_loss_epoch=1.14e+3]
Epoch 72:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.14e+3, train_loss_

[2m[36m(train_tune pid=713766)[0m Global seed set to 1


Epoch 36:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.710, train_loss_epoch=2.710]         
Epoch 53:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=4.170, train_loss_epoch=4.170]         
Epoch 70: 100%|██████████| 1/1 [00:00<00:00, 196.57it/s, v_num=0, train_loss_step=2.580, train_loss_epoch=10.30]
Epoch 71:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.580, train_loss_epoch=2.580]         
Epoch 88:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.010, train_loss_epoch=5.010]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 196.90it/s, v_num=0, train_loss_step=4.520, train_loss_epoch=1.450]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 86.78it/s, v_num=0, train_loss_step=4.520, train_loss_epoch=1.450, valid_loss=0.755]
Epoch 103:   0%|          | 0/1 [00

[2m[36m(train_tune pid=713766)[0m Global seed set to 6


Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.920, train_loss_epoch=2.920]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.759, train_loss_epoch=0.759]         
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.933, train_loss_epoch=0.933]         
Epoch 58: 100%|██████████| 1/1 [00:00<00:00, 202.67it/s, v_num=0, train_loss_step=0.933, train_loss_epoch=0.933]
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.821, train_loss_epoch=0.821]         
Epoch 76:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.861, train_loss_epoch=0.861]         
Epoch 93:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.120, train_loss_epoch=1.120]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 194.02it/s, v_num=0, train_loss_step=1.590, train_loss_epoch=52.40]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 13


Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.870, train_loss_epoch=1.870]         
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.988, train_loss_epoch=0.988]         
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.735, train_loss_epoch=0.735]         
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.430, train_loss_epoch=1.430]         
Epoch 91:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.020, train_loss_epoch=1.020]         
Epoch 91: 100%|██████████| 1/1 [00:00<00:00, 194.11it/s, v_num=0, train_loss_step=2.570, train_loss_epoch=1.020]
Epoch 92:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.570, train_loss_epoch=2.570]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 192.97it/s, v_num=0, train_loss_step=4.280, train_loss_epoch=0.508]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 11


Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.040, train_loss_epoch=1.040]         
Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.928, train_loss_epoch=0.928]         
Epoch 46:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.160, train_loss_epoch=1.160]         
Epoch 61: 100%|██████████| 1/1 [00:00<00:00, 178.86it/s, v_num=0, train_loss_step=0.654, train_loss_epoch=0.257]
Epoch 62:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.654, train_loss_epoch=0.654]         
Epoch 77: 100%|██████████| 1/1 [00:00<00:00, 168.84it/s, v_num=0, train_loss_step=0.993, train_loss_epoch=0.993]
Epoch 78:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.993, train_loss_epoch=0.993]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.823, train_loss_epoch=0.823]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 179.40it/s, v_num=0, train_loss_step=0.895, train_l

[2m[36m(train_tune pid=713766)[0m Global seed set to 18


Epoch 29:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=177.0, train_loss_epoch=177.0]             
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=10.10, train_loss_epoch=10.10]             
Epoch 44: 100%|██████████| 1/1 [00:00<00:00, 170.65it/s, v_num=0, train_loss_step=9.880, train_loss_epoch=10.10]
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=9.880, train_loss_epoch=9.880]         
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.800, train_loss_epoch=2.800]             
Epoch 75:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.140, train_loss_epoch=1.140]         
Epoch 90:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.880, train_loss_epoch=5.880]             
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 167.94it/s, v_num=0, train_loss_step=2.24e+3, train_loss_epoch=1.200]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<

[2m[36m(train_tune pid=713766)[0m Global seed set to 11


Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.850, train_loss_epoch=1.850]         
Epoch 24: 100%|██████████| 1/1 [00:00<00:00, 191.21it/s, v_num=0, train_loss_step=1.850, train_loss_epoch=1.850]
Epoch 25:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.945, train_loss_epoch=0.945]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.180, train_loss_epoch=2.180]         
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.850, train_loss_epoch=1.850]         
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.697, train_loss_epoch=0.697]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.240, train_loss_epoch=1.240]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 181.51it/s, v_num=0, train_loss_step=1.070, train_loss_epoch=2.050]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 1


Epoch 24:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.750, train_loss_epoch=1.750]         
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=1.190]         
Epoch 54: 100%|██████████| 1/1 [00:00<00:00, 171.37it/s, v_num=0, train_loss_step=0.881, train_loss_epoch=0.627]
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.881, train_loss_epoch=0.881]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.688, train_loss_epoch=0.688]         
Epoch 85: 100%|██████████| 1/1 [00:00<00:00, 173.91it/s, v_num=0, train_loss_step=1.010, train_loss_epoch=0.922]
Epoch 86:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.010, train_loss_epoch=1.010]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 170.23it/s, v_num=0, train_loss_step=10.40, train_loss_epoch=0.667]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 18


Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.551, train_loss_epoch=0.551]         
Epoch 48:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.698, train_loss_epoch=0.698]         
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.130, train_loss_epoch=1.130]         
Epoch 80:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.160, train_loss_epoch=1.160]         
Epoch 96:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.408, train_loss_epoch=0.408]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 182.15it/s, v_num=0, train_loss_step=0.346, train_loss_epoch=0.778]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 73.18it/s, v_num=0, train_loss_step=0.346, train_loss_epoch=0.778, valid_loss=0.151]
Epoch 110:   0%|          | 0/1 [00

[2m[36m(train_tune pid=713766)[0m Global seed set to 18


Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.250, train_loss_epoch=3.250]         
Epoch 22: 100%|██████████| 1/1 [00:00<00:00, 173.76it/s, v_num=0, train_loss_step=133.0, train_loss_epoch=133.0]
Epoch 23:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=133.0, train_loss_epoch=133.0]         
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=7.380, train_loss_epoch=7.380]         
Epoch 39: 100%|██████████| 1/1 [00:00<00:00, 180.66it/s, v_num=0, train_loss_step=3.840, train_loss_epoch=7.380]
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.840, train_loss_epoch=3.840]         
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=19.40, train_loss_epoch=19.40]         
Epoch 73:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=2.680, train_loss_epoch=2.680]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.890, train_loss_epoch

[2m[36m(train_tune pid=713766)[0m Global seed set to 17


Epoch 22:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.763, train_loss_epoch=0.763]         
Epoch 39:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.944, train_loss_epoch=0.944]         
Epoch 39: 100%|██████████| 1/1 [00:00<00:00, 196.80it/s, v_num=0, train_loss_step=0.747, train_loss_epoch=0.944]
Epoch 40:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.747, train_loss_epoch=0.747]         
Epoch 57:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.516, train_loss_epoch=0.516]         
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.219, train_loss_epoch=0.219]         
Epoch 91:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.663, train_loss_epoch=0.663]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 191.46it/s, v_num=0, train_loss_step=0.629, train_loss_epoch=0.319]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valid

[2m[36m(train_tune pid=713766)[0m Global seed set to 13


Epoch 10:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.576, train_loss_epoch=0.576]         
Epoch 11:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.576, train_loss_epoch=0.576]
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.610, train_loss_epoch=0.610]         
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.010, train_loss_epoch=1.010]         
Epoch 60:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.210, train_loss_epoch=1.210]         
Epoch 60: 100%|██████████| 1/1 [00:00<00:00, 177.88it/s, v_num=0, train_loss_step=0.804, train_loss_epoch=0.804]
Epoch 61:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.804, train_loss_epoch=0.804]         
Epoch 77:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.851, train_loss_epoch=0.851]         
Epoch 77: 100%|██████████| 1/1 [00:00<00:00, 176.89it/s, v_num=0, train_loss_step=0.846, train_loss_epoch

Global seed set to 10


Epoch 997:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.079, train_loss_epoch=0.079, valid_loss=0.224]           
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 184.69it/s, v_num=0, train_loss_step=0.217, train_loss_epoch=0.0514, valid_loss=0.224] 
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 74.42it/s, v_num=0, train_loss_step=0.217, train_loss_epoch=0.0514, valid_loss=0.264] 
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 57.95it/s, v_num=0, train_loss_step=0.217, train_loss_epoch=0.217, valid_loss=0.264] 


Sanity Checking: 0it [00:00, ?it/s]

Training: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

Validation: 0it [00:00, ?it/s]

IOPub message rate exceeded.
The Jupyter server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--ServerApp.iopub_msg_rate_limit`.

Current values:
ServerApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
ServerApp.rate_limit_window=3.0 (secs)

[2m[36m(pid=718828)[0m   from pandas.core.computation.check import NUMEXPR_INSTALLED
[2m[36m(pid=718828)[0m   warn(f"Failed to load image Python extension: {e}")
[2m[36m(train_tune pid=718828)[0m Global seed set to 17
[2m[36m(train_tune pid=718828)[0m --------------------------------------------------------------------------
[2m[36m(train_tune pid=718828)[0m detected:
[2m[36m(train_tune pid=718828)[0m 
[2m[36m(train_tune pid=718828)[0m   Local host:            152-67-225-75
[2m[36m(train_tune pid=718828)[0m   Device name:           mlx5_0
[2m[36m(train_tune pid=718828)[0m   Device vendor ID:      0x02c9
[2m[36m(train_tune pid=718828)[0m   Devic

Sanity Checking DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/1 [00:00<?, ?it/s]                             
Epoch 12:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=35.70, train_loss_epoch=35.70]         
Epoch 26:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=26.10, train_loss_epoch=26.10]         
Epoch 27:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=171.0, train_loss_epoch=171.0]         
Epoch 41:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=10.90, train_loss_epoch=10.90]         
Epoch 55:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=5.450, train_loss_epoch=5.450]         
Epoch 55: 100%|██████████| 1/1 [00:00<00:00, 151.09it/s, v_num=0, train_loss_step=8.270, train_loss_epoch=8.270]
Epoch 56:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=8.270, train_loss_epoch=8.270]         
Epoch 70:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_lo

[2m[36m(train_tune pid=718828)[0m Global seed set to 4


Epoch 0:   0%|          | 0/1 [00:00<?, ?it/s]                             
Epoch 14:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.340, train_loss_epoch=1.340]         
Epoch 14: 100%|██████████| 1/1 [00:00<00:00, 155.34it/s, v_num=0, train_loss_step=1.820, train_loss_epoch=1.820]
Epoch 15:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.820, train_loss_epoch=1.820]         
Epoch 29: 100%|██████████| 1/1 [00:00<00:00, 170.38it/s, v_num=0, train_loss_step=1.060, train_loss_epoch=1.060]
Epoch 30:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.665, train_loss_epoch=0.665]         
Epoch 44:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.633, train_loss_epoch=0.633]         
Epoch 45:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.548, train_loss_epoch=0.548]         
Epoch 59:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.842, train_loss_epoch=0.842]         
Epoch 60:   0%|     

[2m[36m(train_tune pid=718828)[0m Global seed set to 1


Epoch 13:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=737.0, train_loss_epoch=737.0]            
Epoch 28:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=39.30, train_loss_epoch=39.30]         
Epoch 43:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=189.0, train_loss_epoch=189.0]             
Epoch 58:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=83.50, train_loss_epoch=83.50]             
Epoch 73: 100%|██████████| 1/1 [00:00<00:00, 175.63it/s, v_num=0, train_loss_step=0.431, train_loss_epoch=0.431]
Epoch 74:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.410, train_loss_epoch=1.410]         
Epoch 89:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=3.060, train_loss_epoch=3.060]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 169.73it/s, v_num=0, train_loss_step=3.400, train_loss_epoch=222.0]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/

[2m[36m(train_tune pid=718828)[0m Global seed set to 9


Epoch 3:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=78.60, train_loss_epoch=78.60]             
Epoch 17:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=310.0, train_loss_epoch=310.0]         
Epoch 17: 100%|██████████| 1/1 [00:00<00:00, 153.55it/s, v_num=0, train_loss_step=206.0, train_loss_epoch=206.0]
Epoch 18:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=206.0, train_loss_epoch=206.0]         
Epoch 32:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=85.90, train_loss_epoch=85.90]         
Epoch 32: 100%|██████████| 1/1 [00:00<00:00, 154.16it/s, v_num=0, train_loss_step=61.60, train_loss_epoch=61.60]
Epoch 33:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=61.60, train_loss_epoch=61.60]         
Epoch 47:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=353.0, train_loss_epoch=353.0]         
Epoch 47: 100%|██████████| 1/1 [00:00<00:00, 153.60it/s, v_num=0, train_loss_step=119.0, trai

[2m[36m(train_tune pid=718828)[0m Global seed set to 7


Epoch 4:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.720, train_loss_epoch=1.720]         
Epoch 19:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.981, train_loss_epoch=0.981]         
Epoch 34:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.873, train_loss_epoch=0.873]         
Epoch 49:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.422, train_loss_epoch=0.422]         
Epoch 64:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=12.60, train_loss_epoch=12.60]         
Epoch 79:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.852, train_loss_epoch=0.852]         
Epoch 94:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.779, train_loss_epoch=0.779]         
Epoch 99: 100%|██████████| 1/1 [00:00<00:00, 167.39it/s, v_num=0, train_loss_step=0.892, train_loss_epoch=0.692]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Valida

[2m[36m(train_tune pid=718828)[0m Global seed set to 17


Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 164.84it/s, v_num=0, train_loss_step=0.0905, train_loss_epoch=0.299, valid_loss=0.178]
Validation: 0it [00:00, ?it/s][A[0m 
Validation:   0%|          | 0/1 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/1 [00:00<?, ?it/s][A
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 78.70it/s, v_num=0, train_loss_step=0.0905, train_loss_epoch=0.299, valid_loss=0.186] 
Epoch 999: 100%|██████████| 1/1 [00:00<00:00, 60.29it/s, v_num=0, train_loss_step=0.0905, train_loss_epoch=0.0905, valid_loss=0.186]
Epoch 5:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=1.750, train_loss_epoch=1.750]         
Epoch 20:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.836, train_loss_epoch=0.836]         
Epoch 20: 100%|██████████| 1/1 [00:00<00:00, 159.16it/s, v_num=0, train_loss_step=0.838, train_loss_epoch=0.838]
Epoch 21:   0%|          | 0/1 [00:00<?, ?it/s, v_num=0, train_loss_step=0.838, train_loss_epoch=0.838]   