In [22]:
import os
import sys

import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader, TensorDataset
from tqdm import tqdm

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

from models import new_models
from config import load_data

from ray import tune
from ray.air.integrations.mlflow import MLflowLoggerCallback
from ray.tune.schedulers import ASHAScheduler
from torch.optim.lr_scheduler import ReduceLROnPlateau

import mlflow
from mlflow.tracking import MlflowClient

# Training setup

In [23]:
def fit(net, loss_function, optimizer, data_loader, num_epochs, mode, lr_scheduler, use_amp=False):
    scaler = torch.cuda.amp.GradScaler(enabled=use_amp) # Mixed-precision support for compatible GPUs
    for epoch in range(num_epochs):
        if epoch < num_epochs - 1:
            keys = ["train", "val"]
        else:
            keys = ["train", "val", "test"]
        for key in keys:
            dataset_size = 0
            dataset_loss = 0.0
            if key == "train":
                net.train()
            else:
                net.eval()
            for X_batch, y_batch in tqdm(data_loader[key]):
                X_batch, y_batch = X_batch.to(mode["device"]), y_batch.to(mode["device"])
                with torch.set_grad_enabled(mode=(key=="train")): # Autograd activated only during training
                    with torch.cuda.amp.autocast(enabled=False): # Mixed-precision support for compatible GPUs
                        batch_output = net(X_batch.float())
                        batch_loss = loss_function(batch_output, y_batch)
                    if key == "train":
                        scaler.scale(batch_loss).backward()
                        scaler.step(optimizer) 	
                        scaler.update()
                        optimizer.zero_grad()
                dataset_size += y_batch.shape[0]
                dataset_loss += y_batch.shape[0] * batch_loss.item()

            dataset_loss /= dataset_size

            # Report results to Ray Tune
            if key == "train":
                tune.report(train_loss=dataset_loss)
            elif key == "val":
                # Update learning rate
                lr_scheduler.step(metrics=dataset_loss)
                tune.report(val_loss=dataset_loss)
            else:
                tune.report(test_loss=dataset_loss)
    return net

In [24]:
from config import load_data

def train_model(config, data_dir):

    use_GPU = torch.cuda.is_available()
    if use_GPU:
        mode = {"name": "cuda", "device": torch.device("cuda")}
    else:
        mode = {"name": "cpu", "device": torch.device("cpu")}

    # Define hyperparameters
    train_size = 0.7
    val_size = 0.2
    test_size = 0.1

    sequence_length = config['sequence_length']
    batch_size = config['batch_size']
    num_epochs = config['num_epochs']
    lr = config['lr']
    weight_decay = config['weigth_decay']
    vars = config['variables']

    ld = load_data(data_dir = data_dir, target_variable = config['target_variable'])
    
    X, y = ld.create_lagged_matrix(window_size=sequence_length, vars_to_lag=vars)

    X_train, y_train, X_val, y_val, X_test, y_test = ld.split_data(X, y, train_size=train_size, val_size=val_size, test_size=test_size)

    train_dataloader = ld.create_dataloader(X_train, y_train, sequence_length, batch_size=batch_size, shuffle=True)
    val_dataloader = ld.create_dataloader(X_val, y_val, sequence_length, batch_size=batch_size, shuffle=True)
    test_dataloader = ld.create_dataloader(X_test, y_test, sequence_length, batch_size=batch_size, shuffle=False)
    
    # Model inputs
    if vars:
        input_size = len(vars) + 1
    else:
        input_size = 1
    hidden_size = config['hidden_size']
    num_layers = config['num_layers']
    output_size = 1

    if config['arch'] == "FCN":
        net = new_models.FCN(input_size,
                    hidden_size,
                    num_layers,
                    output_size,
                    )
    elif config['arch'] ==  "FCNTemporalAttention":
        net = new_models.FCNTemporalAttention(input_size,
                    hidden_size,
                    num_layers,
                    output_size,
                    )
    elif config['arch'] == "LSTM":
        net = new_models.LSTM(input_size,
                    hidden_size,
                    num_layers,
                    output_size,
                    )
    elif config['arch'] == "LSTMTemporalAttention":
        net = new_models.LSTMTemporalAttention(input_size,
                    hidden_size,
                    num_layers,
                    output_size,
                    )
    elif config['arch'] == "LSTMSpatialTemporalAttention":
        net = new_models.LSTMSpatialTemporalAttention(input_size,
                    hidden_size,
                    num_layers,
                    output_size,
                    )

    data_loader = {
    "train": train_dataloader,
    "val": val_dataloader,
    "test": test_dataloader,
    }
    
    net.to(mode["device"])

    loss_function = nn.MSELoss().to(mode["device"])
    optimizer = optim.Adam(net.parameters(), lr=lr, weight_decay=weight_decay)

    # Define your learning rate scheduler
    lr_scheduler = ReduceLROnPlateau(optimizer, mode='min', factor=0.5, patience=5, verbose=True)
                                           
    best_net = fit(net, loss_function, optimizer, data_loader, num_epochs, mode, lr_scheduler, use_amp=True)
    out_name = ""
    for k, v in config.items():
        if not k in ['weights_dir', 'cwd', 'variables']:
            out_name += '{}-{}_'.format(k, v)
    torch.save(best_net.state_dict(), os.path.join(config['cwd'], config['weights_dir'], out_name[:-1] + '.pth'))

# MLFlow setup

In [25]:
client = MlflowClient()
cwd = os.getcwd()
exp_base_name = "Test_of_interface"

created = 0
for i in range(100):
    try:
        exp_name = exp_base_name+"_{}".format(i)
        experiment_id = client.create_experiment(exp_name)
        created=1
        break
    except (TypeError, mlflow.exceptions.MlflowException):
        continue

if not created:
    print("ERROR: Try new experiment name.")
    sys.exit(1)

weights_root = "./model_weights/"
weights_dir = weights_root+exp_name+'/'
os.mkdir(weights_dir)

In [26]:
data_dir = "./data/"
target_variable = 'Flow_Kalltveit'

# Start experiments

In [27]:
Discharge = ['Flow_Tapping', 'Flow_Lyngsaana']
HBV = ['Mean_Flow_HBV',
 'Flow_HBV',
 'Evaporation_HBV',
 'SNOW_MELT_HBV',
 'Precipitation_HBV',
 'Groundwater_Storage_HBV',
 'Temperature_HBV',
 'Soil_Water_Storage_HBV']
Loggers = ['Water_Level_Lyngsaana',
 'Water_Temperature_Hiafossen',
 'Water_Level_Hiafossen',
 'Water_Level_Kalltveit',
 'Water_Temperature_Kalltveit_Kum',
 'Water_Temperature_Hiavatn',
 'Water_Level_Hiavatn',
 'Water_Temperature_Musdalsvatn',
 'Water_Level_Musdalsvatn',
 'Water_Temperature_Musdalsvatn_Downstream',
 'Water_Level_Musdalsvatn_Downstream',
 'Water_Temperature_Viglesdalsvatn',
 'Water_Level_Viglesdalsvatn',
 'Water_Temperature_Lyngsaana',
 'Water_Temperature_Kalltveit_River']
Loggers_1 = ['Water_Temperature_Lyngsaana', 'Water_Level_Lyngsaana']
Loggers_2 = ['Water_Temperature_Kalltveit_Kum', 'Water_Level_Kalltveit']
Loggers_3 = ['Water_Temperature_Hiavatn', 'Water_Level_Hiavatn']
Loggers_4 = ['Water_Temperature_Musdalsvatn', 'Water_Level_Musdalsvatn']
Loggers_5 = ['Water_Temperature_Musdalsvatn_Downstream',
 'Water_Level_Musdalsvatn_Downstream']
Loggers_6 = ['Water_Temperature_Viglesdalsvatn', 'Water_Level_Viglesdalsvatn']
Loggers_7 = ['Water_Temperature_Kalltveit_River']
Loggers_8 = ['Water_Level_Hiafossen']
Meto = ['Precipitation_Nilsebu',
 'Precipitation_Fister',
 'Air_Temperature_Fister',
 'Air_Temperature_Nilsebu',
 'Relative_Humidity_Nilsebu',
 'Wind_Direction_Nilsebu']
Meto_1 = ['Precipitation_Nilsebu',
 'Air_Temperature_Nilsebu',
 'Relative_Humidity_Nilsebu',
 'Wind_Direction_Nilsebu']
Meto_2 = ['Precipitation_Fister', 'Air_Temperature_Fister']
Meto_Pre_Air_Nilsebu = ['Precipitation_Nilsebu', 'Air_Temperature_Nilsebu']
Meto_Pre_Air_Fister = ['Precipitation_Fister', 'Air_Temperature_Fister']


In [28]:
from functools import partial

config = {
    "mlflow_experiment_id": experiment_id,
    "weights_dir": weights_dir,
    "cwd": cwd,
    "target_variable": target_variable,
    "arch": tune.grid_search(["LSTM", "LSTMTemporalAttention"]), # "FCN", "FCNTemporalAttention", "LSTMTemporalAttention", "LSTM", "LSTMSpatialAttention", "LSTMSpatialTemporalAttention"
    "sequence_length": tune.choice([25]),
    'num_epochs': tune.choice([150]),
    'num_layers': tune.choice([2, 3, 4]),
    "lr": tune.loguniform(1e-4, 1e-1),
    "weigth_decay": tune.choice([0, 0.001, 0.0001]),
    "batch_size": tune.choice([128, 256, 512]),
    "hidden_size": tune.choice([32, 64]),
    "variables": tune.grid_search([
        Discharge+HBV,
        Discharge+HBV+Meto_1+Loggers_1,
        Discharge+HBV+Meto_2+Loggers_2,
    ])
}

analysis = tune.run(
    partial(train_model, data_dir=data_dir),
    config=config,
    resources_per_trial={"cpu": 12, "gpu": 1},
    num_samples=1,
    callbacks=[MLflowLoggerCallback(experiment_name=exp_name)],
)

0,1
Current time:,2023-03-27 18:37:15
Running for:,00:00:03.98
Memory:,14.9/31.9 GiB

Trial name,status,loc,arch,batch_size,hidden_size,lr,num_epochs,num_layers,sequence_length,variables,weigth_decay
train_model_9f615_00000,RUNNING,127.0.0.1:1316,FCN,512,64,0.000393055,150,2,25,,0.0001
train_model_9f615_00001,PENDING,,FCNTemporalAttention,128,64,0.00526328,150,4,25,,0.0
train_model_9f615_00002,PENDING,,LSTM,128,64,0.000834535,150,4,25,,0.0
train_model_9f615_00003,PENDING,,LSTMTemporalAtt_e350,128,64,0.000760256,150,4,25,,0.001
train_model_9f615_00004,PENDING,,FCN,256,32,0.000105767,150,2,25,['Flow_Tapping'_7548,0.0
train_model_9f615_00005,PENDING,,FCNTemporalAttention,128,64,0.000117294,150,4,25,['Flow_Tapping'_8a48,0.001
train_model_9f615_00006,PENDING,,LSTM,512,32,0.0302384,150,4,25,['Flow_Tapping'_8888,0.0
train_model_9f615_00007,PENDING,,LSTMTemporalAtt_e350,128,32,0.0870142,150,4,25,['Flow_Tapping'_b6c8,0.001
train_model_9f615_00008,PENDING,,FCN,128,32,0.0243872,150,2,25,['Mean_Flow_HBV_3b48,0.001
train_model_9f615_00009,PENDING,,FCNTemporalAttention,256,32,0.0694789,150,3,25,['Mean_Flow_HBV_e888,0.0001


  0%|          | 0/87 [00:00<?, ?it/s]
  1%|          | 1/87 [00:01<02:32,  1.78s/it]
 15%|█▍        | 13/87 [00:01<00:07,  9.40it/s]
 32%|███▏      | 28/87 [00:01<00:02, 22.79it/s]
 51%|█████     | 44/87 [00:02<00:01, 39.07it/s]
 66%|██████▌   | 57/87 [00:02<00:00, 52.09it/s]
 84%|████████▍ | 73/87 [00:02<00:00, 69.98it/s]
100%|██████████| 87/87 [00:02<00:00, 36.39it/s]


Trial name,date,done,episodes_total,experiment_id,hostname,iterations_since_restore,node_ip,pid,time_since_restore,time_this_iter_s,time_total_s,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,val_loss,warmup_time
train_model_9f615_00000,2023-03-27_18-37-23,False,,723c91fe51eb4cf0a3cc05e24709ba3c,DESKTOP-D4IVECG,14,127.0.0.1,1316,7.76112,0.210976,7.76112,1679935043,0,,14,9f615_00000,36.7247,0.00390506


  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 155.28it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 [00:00<00:00, 149.50it/s]
 37%|███▋      | 32/87 [00:00<00:00, 157.05it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 155.47it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 153.14it/s]
100%|██████████| 87/87 [00:00<00:00, 155.86it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 319.53it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 [00:00<00:00, 143.86it/s]
 34%|███▍      | 30/87 [00:00<00:00, 143.71it/s]
 54%|█████▍    | 47/87 [00:00<00:00, 151.16it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 153.00it/s]
100%|██████████| 87/87 [00:00<00:00, 149.18it/s]
100%|██████████| 25/25 [00:00<00:00, 298.37it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 136.98it/s]
 33%|███▎      | 29/87 [00:00<00:00, 142.36it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 145.47it/s]
 69%|██████▉   | 60/8

[2m[36m(func pid=1316)[0m Epoch 00015: reducing learning rate of group 0 to 1.9653e-04.


 20%|█▉        | 17/87 [00:00<00:00, 166.60it/s]
 39%|███▉      | 34/87 [00:00<00:00, 163.78it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 165.01it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 164.03it/s]
100%|██████████| 87/87 [00:00<00:00, 157.88it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 76%|███████▌  | 19/25 [00:00<00:00, 122.81it/s]
100%|██████████| 25/25 [00:00<00:00, 144.52it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 20%|█▉        | 17/87 [00:00<00:00, 161.48it/s]
 39%|███▉      | 34/87 [00:00<00:00, 162.88it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 163.17it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 162.61it/s]
100%|██████████| 87/87 [00:00<00:00, 162.85it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 346.57it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 20%|█▉        | 17/87 [00:00<00:00, 166.69it/s]
 39%|███▉      | 34/87 [00:00<00:00, 168.00it/s]
 60%|█████▉    | 52/87 [00:00<00:00, 169.58it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 167.11it/s]
100%|██████

[2m[36m(func pid=1316)[0m Epoch 00021: reducing learning rate of group 0 to 9.8264e-05.


 39%|███▉      | 34/87 [00:00<00:00, 163.99it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 157.59it/s]
 77%|███████▋  | 67/87 [00:00<00:00, 156.70it/s]
100%|██████████| 87/87 [00:00<00:00, 159.03it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 165.44it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 37%|███▋      | 32/87 [00:00<00:00, 155.63it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 158.72it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 161.25it/s]
100%|██████████| 87/87 [00:00<00:00, 159.03it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 334.39it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 157.08it/s]
 38%|███▊      | 33/87 [00:00<00:00, 160.90it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 165.12it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 168.30it/s]
100%|██████████| 87/87 [00:00<00:00, 165.30it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 334.57it/s]
  0%|          | 0/87

[2m[36m(func pid=1316)[0m Epoch 00030: reducing learning rate of group 0 to 4.9132e-05.


 37%|███▋      | 32/87 [00:00<00:00, 157.59it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 159.53it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 157.14it/s]
100%|██████████| 87/87 [00:00<00:00, 159.60it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 32%|███▏      | 8/25 [00:00<00:00, 71.26it/s]
100%|██████████| 25/25 [00:00<00:00, 153.28it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 159.75it/s]
 39%|███▉      | 34/87 [00:00<00:00, 165.60it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 163.93it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 165.74it/s]
100%|██████████| 87/87 [00:00<00:00, 165.39it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 346.71it/s]
 20%|█▉        | 17/87 [00:00<00:00, 168.55it/s]
 39%|███▉      | 34/87 [00:00<00:00, 167.42it/s]
 60%|█████▉    | 52/87 [00:00<00:00, 169.28it/s]
 80%|████████  | 70/87 [00:00<00:00, 170.77it/s]
100%|██████████| 87/87 [00:00<00:00, 166.98it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|████████

[2m[36m(func pid=1316)[0m Epoch 00036: reducing learning rate of group 0 to 2.4566e-05.


 17%|█▋        | 15/87 [00:00<00:00, 149.70it/s]
 37%|███▋      | 32/87 [00:00<00:00, 158.34it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 159.76it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 159.75it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 153.01it/s]
100%|██████████| 87/87 [00:00<00:00, 154.79it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 147.67it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 20%|█▉        | 17/87 [00:00<00:00, 161.01it/s]
 39%|███▉      | 34/87 [00:00<00:00, 154.90it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 157.98it/s]
 77%|███████▋  | 67/87 [00:00<00:00, 146.52it/s]
100%|██████████| 87/87 [00:00<00:00, 145.49it/s]
100%|██████████| 25/25 [00:00<00:00, 300.79it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 155.46it/s]
 37%|███▋      | 32/87 [00:00<00:00, 152.65it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 149.92it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 151.46it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 156.16it/s]
1

[2m[36m(func pid=1316)[0m Epoch 00042: reducing learning rate of group 0 to 1.2283e-05.


 18%|█▊        | 16/87 [00:00<00:00, 156.73it/s]
 37%|███▋      | 32/87 [00:00<00:00, 155.85it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 156.15it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 156.33it/s]
 92%|█████████▏| 80/87 [00:00<00:00, 142.32it/s]
100%|██████████| 87/87 [00:00<00:00, 144.50it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 145.81it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 15%|█▍        | 13/87 [00:00<00:00, 125.23it/s]
 46%|████▌     | 40/87 [00:00<00:00, 129.86it/s]
 61%|██████    | 53/87 [00:00<00:00, 129.75it/s]
 77%|███████▋  | 67/87 [00:00<00:00, 130.20it/s]
100%|██████████| 87/87 [00:00<00:00, 131.59it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 282.12it/s]
 16%|█▌        | 14/87 [00:00<00:00, 132.34it/s]
 32%|███▏      | 28/87 [00:00<00:00, 133.62it/s]
 48%|████▊     | 42/87 [00:00<00:00, 135.70it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 131.64it/s]
 83%|████████▎ | 72/87 [00:00<00:00, 138.85it/s]
1

[2m[36m(func pid=1316)[0m Epoch 00048: reducing learning rate of group 0 to 6.1415e-06.


 31%|███       | 27/87 [00:00<00:00, 127.09it/s]
 48%|████▊     | 42/87 [00:00<00:00, 136.02it/s]
 66%|██████▌   | 57/87 [00:00<00:00, 140.19it/s]
 83%|████████▎ | 72/87 [00:00<00:00, 137.56it/s]
100%|██████████| 87/87 [00:00<00:00, 134.74it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 32%|███▏      | 8/25 [00:00<00:00, 64.02it/s]
100%|██████████| 25/25 [00:00<00:00, 135.89it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 32%|███▏      | 28/87 [00:00<00:00, 139.19it/s]
 51%|█████     | 44/87 [00:00<00:00, 147.27it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 151.76it/s]
 87%|████████▋ | 76/87 [00:00<00:00, 153.29it/s]
100%|██████████| 87/87 [00:00<00:00, 144.78it/s]
100%|██████████| 25/25 [00:00<00:00, 283.22it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 133.43it/s]
 32%|███▏      | 28/87 [00:00<00:00, 118.67it/s]
 49%|████▉     | 43/87 [00:00<00:00, 130.95it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 142.59it/s]
 87%|████████▋ | 76/87 [00:00<00:00, 147.70it/s]
100

[2m[36m(func pid=1316)[0m Epoch 00054: reducing learning rate of group 0 to 3.0707e-06.


 17%|█▋        | 15/87 [00:00<00:00, 147.05it/s]
 36%|███▌      | 31/87 [00:00<00:00, 153.87it/s]
 54%|█████▍    | 47/87 [00:00<00:00, 156.52it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 153.15it/s]
 91%|█████████ | 79/87 [00:00<00:00, 149.26it/s]
100%|██████████| 87/87 [00:00<00:00, 148.84it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 152.23it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 20%|█▉        | 17/87 [00:00<00:00, 160.55it/s]
 39%|███▉      | 34/87 [00:00<00:00, 162.17it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 161.86it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 158.38it/s]
100%|██████████| 87/87 [00:00<00:00, 157.37it/s]
100%|██████████| 25/25 [00:00<00:00, 332.56it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 159.95it/s]
 37%|███▋      | 32/87 [00:00<00:00, 157.18it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 158.33it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 157.78it/s]
100%|██████████| 87/87 [00:00<00:00, 157.53it/s]
 

[2m[36m(func pid=1316)[0m Epoch 00060: reducing learning rate of group 0 to 1.5354e-06.


 17%|█▋        | 15/87 [00:00<00:00, 144.11it/s]
 36%|███▌      | 31/87 [00:00<00:00, 148.79it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 154.30it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 151.29it/s]
100%|██████████| 87/87 [00:00<00:00, 145.92it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 154.38it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 [00:00<00:00, 145.78it/s]
 37%|███▋      | 32/87 [00:00<00:00, 157.30it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 160.07it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 158.34it/s]
100%|██████████| 87/87 [00:00<00:00, 158.25it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 319.77it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 154.10it/s]
 37%|███▋      | 32/87 [00:00<00:00, 156.57it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 161.16it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 160.22it/s]
100%|██████████| 87/87 [00:00<00:00, 159.37it/s]
100%|██████

[2m[36m(func pid=1316)[0m Epoch 00066: reducing learning rate of group 0 to 7.6769e-07.


  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 134.09it/s]
 32%|███▏      | 28/87 [00:00<00:00, 136.73it/s]
 48%|████▊     | 42/87 [00:00<00:00, 135.75it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 136.97it/s]
 80%|████████  | 70/87 [00:00<00:00, 129.68it/s]
100%|██████████| 87/87 [00:00<00:00, 131.93it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 32%|███▏      | 8/25 [00:00<00:00, 69.66it/s]
100%|██████████| 25/25 [00:00<00:00, 141.99it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 132.99it/s]
 32%|███▏      | 28/87 [00:00<00:00, 130.53it/s]
 48%|████▊     | 42/87 [00:00<00:00, 131.59it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 133.74it/s]
 80%|████████  | 70/87 [00:00<00:00, 132.28it/s]
 97%|█████████▋| 84/87 [00:00<00:00, 134.68it/s]
100%|██████████| 87/87 [00:00<00:00, 133.40it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 299.76it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 

[2m[36m(func pid=1316)[0m Epoch 00072: reducing learning rate of group 0 to 3.8384e-07.


 17%|█▋        | 15/87 [00:00<00:00, 142.48it/s]
 34%|███▍      | 30/87 [00:00<00:00, 138.57it/s]
 51%|█████     | 44/87 [00:00<00:00, 139.03it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 142.08it/s]
 85%|████████▌ | 74/87 [00:00<00:00, 141.34it/s]
100%|██████████| 87/87 [00:00<00:00, 139.98it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 148.89it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 133.32it/s]
 33%|███▎      | 29/87 [00:00<00:00, 140.88it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 149.40it/s]
 70%|███████   | 61/87 [00:00<00:00, 151.84it/s]
 89%|████████▊ | 77/87 [00:00<00:00, 150.84it/s]
100%|██████████| 87/87 [00:00<00:00, 150.59it/s]
100%|██████████| 25/25 [00:00<00:00, 342.73it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 155.06it/s]
 37%|███▋      | 32/87 [00:00<00:00, 155.27it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 156.67it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 155.61it/s]
 

[2m[36m(func pid=1316)[0m Epoch 00078: reducing learning rate of group 0 to 1.9192e-07.


 32%|███▏      | 28/87 [00:00<00:00, 136.71it/s]
 48%|████▊     | 42/87 [00:00<00:00, 137.75it/s]
 66%|██████▌   | 57/87 [00:00<00:00, 139.68it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 139.79it/s]
100%|██████████| 87/87 [00:00<00:00, 138.95it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 135.09it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 134.15it/s]
 32%|███▏      | 28/87 [00:00<00:00, 130.80it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 135.22it/s]
 80%|████████  | 70/87 [00:00<00:00, 135.18it/s]
100%|██████████| 87/87 [00:00<00:00, 134.80it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 266.15it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 [00:00<00:00, 141.15it/s]
 34%|███▍      | 30/87 [00:00<00:00, 142.78it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 141.64it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 136.90it/s]
 86%|████████▌ | 75/87 [00:00<00:00, 137.29it/s]
100%|██████

[2m[36m(func pid=1316)[0m Epoch 00084: reducing learning rate of group 0 to 9.5961e-08.


 37%|███▋      | 32/87 [00:00<00:00, 150.35it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 143.17it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 141.13it/s]
100%|██████████| 87/87 [00:00<00:00, 147.09it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 163.51it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 153.49it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 155.91it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 157.04it/s]
 94%|█████████▍| 82/87 [00:00<00:00, 159.29it/s]
100%|██████████| 87/87 [00:00<00:00, 156.41it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 335.53it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 17%|█▋        | 15/87 [00:00<00:00, 145.35it/s]
 34%|███▍      | 30/87 [00:00<00:00, 145.55it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 144.24it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 144.67it/s]
100%|██████████| 87/87 [00:00<00:00, 145.89it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/2

[2m[36m(func pid=1316)[0m Epoch 00090: reducing learning rate of group 0 to 4.7980e-08.


 36%|███▌      | 31/87 [00:00<00:00, 137.22it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 135.72it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 135.17it/s]
 85%|████████▌ | 74/87 [00:00<00:00, 138.02it/s]
100%|██████████| 87/87 [00:00<00:00, 136.57it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 144.31it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 31%|███       | 27/87 [00:00<00:00, 130.85it/s]
 49%|████▉     | 43/87 [00:00<00:00, 142.25it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 146.91it/s]
 86%|████████▌ | 75/87 [00:00<00:00, 149.93it/s]
100%|██████████| 87/87 [00:00<00:00, 146.50it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 334.85it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 33%|███▎      | 29/87 [00:00<00:00, 141.47it/s]
 51%|█████     | 44/87 [00:00<00:00, 142.51it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 144.33it/s]
 86%|████████▌ | 75/87 [00:00<00:00, 147.78it/s]
100%|██████████| 87/87 [00:00<00:00, 146.68it/s]
  0%|      

[2m[36m(func pid=1316)[0m Epoch 00096: reducing learning rate of group 0 to 2.3990e-08.


 20%|█▉        | 17/87 [00:00<00:00, 160.92it/s]
 39%|███▉      | 34/87 [00:00<00:00, 152.65it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 154.50it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 154.50it/s]
100%|██████████| 87/87 [00:00<00:00, 148.28it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 156.42it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 155.09it/s]
 37%|███▋      | 32/87 [00:00<00:00, 155.02it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 155.31it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 157.50it/s]
 94%|█████████▍| 82/87 [00:00<00:00, 158.98it/s]
100%|██████████| 87/87 [00:00<00:00, 157.55it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 299.73it/s]
 16%|█▌        | 14/87 [00:00<00:00, 133.61it/s]
 32%|███▏      | 28/87 [00:00<00:00, 135.02it/s]
 48%|████▊     | 42/87 [00:00<00:00, 135.43it/s]
 67%|██████▋   | 58/87 [00:00<00:00, 142.14it/s]
 85%|████████▌ | 74/87 [00:00<00:00, 146.43it/s]
1

[2m[36m(func pid=1316)[0m Epoch 00102: reducing learning rate of group 0 to 1.1995e-08.


 36%|███▌      | 31/87 [00:00<00:00, 152.32it/s]
 54%|█████▍    | 47/87 [00:00<00:00, 152.97it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 153.87it/s]
100%|██████████| 87/87 [00:00<00:00, 151.00it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 148.95it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊        | 16/87 [00:00<00:00, 154.85it/s]
 37%|███▋      | 32/87 [00:00<00:00, 157.22it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 154.30it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 154.69it/s]
100%|██████████| 87/87 [00:00<00:00, 150.80it/s]
100%|██████████| 25/25 [00:00<00:00, 297.83it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 16%|█▌        | 14/87 [00:00<00:00, 136.11it/s]
 33%|███▎      | 29/87 [00:00<00:00, 139.84it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 143.91it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 144.60it/s]
100%|██████████| 87/87 [00:00<00:00, 146.48it/s]
100%|██████████| 25/25 [00:00<00:00, 336.19it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 18%|█▊    

[2m[36m(func pid=21900)[0m Epoch 00008: reducing learning rate of group 0 to 2.6316e-03.


  9%|▊         | 30/346 [00:00<00:02, 138.50it/s]
 13%|█▎        | 44/346 [00:00<00:02, 135.45it/s]
 17%|█▋        | 58/346 [00:00<00:02, 132.40it/s]
 21%|██        | 72/346 [00:00<00:02, 130.52it/s]
 29%|██▉       | 101/346 [00:00<00:01, 136.86it/s]
 33%|███▎      | 115/346 [00:00<00:01, 137.37it/s]
 38%|███▊      | 130/346 [00:00<00:01, 138.45it/s]
 42%|████▏     | 144/346 [00:01<00:01, 138.18it/s]
 46%|████▌     | 158/346 [00:01<00:01, 136.74it/s]
 50%|█████     | 173/346 [00:01<00:01, 138.29it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 137.62it/s]
 58%|█████▊    | 201/346 [00:01<00:01, 138.24it/s]
 62%|██████▏   | 216/346 [00:01<00:00, 140.49it/s]
 67%|██████▋   | 231/346 [00:01<00:00, 142.35it/s]
 71%|███████   | 246/346 [00:01<00:00, 127.39it/s]
 75%|███████▌  | 260/346 [00:01<00:00, 130.69it/s]
 79%|███████▉  | 275/346 [00:02<00:00, 134.35it/s]
 84%|████████▍ | 290/346 [00:02<00:00, 137.52it/s]
 88%|████████▊ | 304/346 [00:02<00:00, 137.13it/s]
 92%|█████████▏| 319/346 [00:02<00:

[2m[36m(func pid=21900)[0m Epoch 00014: reducing learning rate of group 0 to 1.3158e-03.


  9%|▉         | 32/346 [00:00<00:02, 138.44it/s]
 14%|█▍        | 48/346 [00:00<00:02, 146.41it/s]
 18%|█▊        | 63/346 [00:00<00:01, 145.39it/s]
 28%|██▊       | 96/346 [00:00<00:01, 152.81it/s]
 33%|███▎      | 113/346 [00:00<00:01, 155.55it/s]
 37%|███▋      | 129/346 [00:00<00:01, 155.44it/s]
 42%|████▏     | 145/346 [00:00<00:01, 156.74it/s]
 47%|████▋     | 161/346 [00:01<00:01, 155.69it/s]
 51%|█████     | 177/346 [00:01<00:01, 156.34it/s]
 56%|█████▌    | 193/346 [00:01<00:00, 153.30it/s]
 61%|██████    | 210/346 [00:01<00:00, 156.70it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 154.96it/s]
 70%|███████   | 243/346 [00:01<00:00, 157.28it/s]
 75%|███████▍  | 259/346 [00:01<00:00, 156.14it/s]
 80%|███████▉  | 276/346 [00:01<00:00, 157.87it/s]
 85%|████████▍ | 293/346 [00:01<00:00, 157.67it/s]
 89%|████████▉ | 309/346 [00:02<00:00, 155.97it/s]
 94%|█████████▍| 325/346 [00:02<00:00, 154.61it/s]
  0%|          | 0/99 [00:00<?, ?it/s]
 61%|██████    | 60/99 [00:00<00:00, 594.36it/s

[2m[36m(func pid=21900)[0m Epoch 00020: reducing learning rate of group 0 to 6.5791e-04.


  4%|▍         | 15/346 [00:00<00:02, 143.97it/s]
  9%|▊         | 30/346 [00:00<00:02, 137.30it/s]
 13%|█▎        | 45/346 [00:00<00:02, 140.44it/s]
 17%|█▋        | 60/346 [00:00<00:02, 135.58it/s]
 21%|██▏       | 74/346 [00:00<00:02, 135.46it/s]
 25%|██▌       | 88/346 [00:00<00:01, 134.22it/s]
 30%|██▉       | 103/346 [00:00<00:01, 136.75it/s]
 34%|███▍      | 118/346 [00:00<00:01, 139.44it/s]
 38%|███▊      | 132/346 [00:00<00:01, 128.38it/s]
 42%|████▏     | 146/346 [00:01<00:01, 129.58it/s]
 46%|████▌     | 160/346 [00:01<00:01, 131.24it/s]
 50%|█████     | 174/346 [00:01<00:01, 132.79it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 133.84it/s]
 59%|█████▊    | 203/346 [00:01<00:01, 137.56it/s]
 63%|██████▎   | 217/346 [00:01<00:00, 137.39it/s]
 67%|██████▋   | 232/346 [00:01<00:00, 138.74it/s]
 71%|███████   | 246/346 [00:01<00:00, 134.66it/s]
 79%|███████▉  | 274/346 [00:02<00:00, 134.67it/s]
 83%|████████▎ | 288/346 [00:02<00:00, 133.69it/s]
 87%|████████▋ | 302/346 [00:02<00:00

[2m[36m(func pid=21900)[0m Epoch 00026: reducing learning rate of group 0 to 3.2896e-04.


 10%|▉         | 33/346 [00:00<00:01, 163.02it/s]
 15%|█▍        | 51/346 [00:00<00:01, 166.61it/s]
 20%|█▉        | 68/346 [00:00<00:01, 162.33it/s]
 25%|██▍       | 85/346 [00:00<00:01, 161.89it/s]
 29%|██▉       | 102/346 [00:00<00:01, 160.73it/s]
 34%|███▍      | 119/346 [00:00<00:01, 160.59it/s]
 39%|███▉      | 136/346 [00:00<00:01, 161.84it/s]
 44%|████▍     | 153/346 [00:00<00:01, 158.70it/s]
 49%|████▉     | 169/346 [00:01<00:01, 154.57it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 150.52it/s]
 58%|█████▊    | 201/346 [00:01<00:00, 153.18it/s]
 63%|██████▎   | 217/346 [00:01<00:00, 153.69it/s]
 67%|██████▋   | 233/346 [00:01<00:00, 152.91it/s]
 72%|███████▏  | 249/346 [00:01<00:00, 151.58it/s]
 77%|███████▋  | 265/346 [00:01<00:00, 151.43it/s]
 81%|████████  | 281/346 [00:01<00:00, 150.35it/s]
 86%|████████▌ | 297/346 [00:01<00:00, 148.40it/s]
 90%|█████████ | 313/346 [00:02<00:00, 150.50it/s]
 95%|█████████▌| 329/346 [00:02<00:00, 152.28it/s]
100%|██████████| 346/346 [00:02<00:

[2m[36m(func pid=21900)[0m Epoch 00032: reducing learning rate of group 0 to 1.6448e-04.


  8%|▊         | 27/346 [00:00<00:02, 133.82it/s]
 12%|█▏        | 41/346 [00:00<00:02, 132.45it/s]
 16%|█▌        | 55/346 [00:00<00:02, 131.28it/s]
 20%|█▉        | 69/346 [00:00<00:02, 133.02it/s]
 25%|██▍       | 85/346 [00:00<00:01, 138.22it/s]
 29%|██▊       | 99/346 [00:00<00:01, 137.52it/s]
 33%|███▎      | 113/346 [00:00<00:01, 137.39it/s]
 37%|███▋      | 127/346 [00:00<00:01, 136.40it/s]
 41%|████      | 141/346 [00:01<00:01, 136.77it/s]
 45%|████▌     | 156/346 [00:01<00:01, 138.84it/s]
 49%|████▉     | 170/346 [00:01<00:01, 132.62it/s]
 53%|█████▎    | 184/346 [00:01<00:01, 130.02it/s]
 57%|█████▋    | 198/346 [00:01<00:01, 130.95it/s]
 61%|██████▏   | 212/346 [00:01<00:01, 132.05it/s]
 66%|██████▌   | 227/346 [00:01<00:00, 135.50it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 133.86it/s]
 74%|███████▎  | 255/346 [00:01<00:00, 134.50it/s]
 78%|███████▊  | 269/346 [00:01<00:00, 135.57it/s]
 82%|████████▏ | 284/346 [00:02<00:00, 137.76it/s]
 86%|████████▌ | 298/346 [00:02<00:00




  4%|▍         | 15/346 [00:00<00:02, 143.02it/s]
  9%|▉         | 32/346 [00:00<00:02, 153.19it/s]
 14%|█▍        | 48/346 [00:00<00:01, 152.88it/s]
 18%|█▊        | 64/346 [00:00<00:01, 153.89it/s]
 23%|██▎       | 80/346 [00:00<00:01, 155.97it/s]
 28%|██▊       | 96/346 [00:00<00:01, 140.76it/s]
 32%|███▏      | 111/346 [00:00<00:01, 141.74it/s]
 36%|███▋      | 126/346 [00:00<00:01, 142.46it/s]
 45%|████▌     | 157/346 [00:01<00:01, 145.94it/s]
 50%|█████     | 174/346 [00:01<00:01, 151.03it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 152.47it/s]
 60%|█████▉    | 206/346 [00:01<00:00, 154.34it/s]
 64%|██████▍   | 222/346 [00:01<00:00, 152.35it/s]
 69%|██████▉   | 238/346 [00:01<00:00, 151.95it/s]
 74%|███████▎  | 255/346 [00:01<00:00, 155.63it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 155.29it/s]
 83%|████████▎ | 288/346 [00:01<00:00, 155.85it/s]
 88%|████████▊ | 305/346 [00:02<00:00, 157.14it/s]
 93%|█████████▎| 322/346 [00:02<00:00, 158.82it/s]
 98%|█████████▊| 338/346 [00:02<00:00

[2m[36m(func pid=21900)[0m Epoch 00044: reducing learning rate of group 0 to 4.1119e-05.


  8%|▊         | 28/346 [00:00<00:02, 136.04it/s]
 12%|█▏        | 42/346 [00:00<00:02, 120.64it/s]
 16%|█▋        | 57/346 [00:00<00:02, 129.38it/s]
 21%|██        | 72/346 [00:00<00:02, 134.47it/s]
 25%|██▌       | 87/346 [00:00<00:01, 138.04it/s]
 29%|██▉       | 101/346 [00:00<00:01, 136.46it/s]
 34%|███▎      | 116/346 [00:00<00:01, 139.39it/s]
 38%|███▊      | 131/346 [00:00<00:01, 140.85it/s]
 42%|████▏     | 146/346 [00:01<00:01, 139.00it/s]
 47%|████▋     | 161/346 [00:01<00:01, 139.86it/s]
 51%|█████     | 176/346 [00:01<00:01, 141.62it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 141.48it/s]
 60%|█████▉    | 206/346 [00:01<00:00, 140.76it/s]
 64%|██████▍   | 221/346 [00:01<00:00, 141.31it/s]
 68%|██████▊   | 236/346 [00:01<00:00, 139.02it/s]
 73%|███████▎  | 251/346 [00:01<00:00, 139.83it/s]
 77%|███████▋  | 265/346 [00:01<00:00, 139.80it/s]
 81%|████████  | 279/346 [00:02<00:00, 139.35it/s]
 85%|████████▍ | 293/346 [00:02<00:00, 138.16it/s]
 89%|████████▉ | 308/346 [00:02<00:0

[2m[36m(func pid=21900)[0m Epoch 00050: reducing learning rate of group 0 to 2.0560e-05.


  9%|▉         | 31/346 [00:00<00:02, 148.95it/s]
 14%|█▍        | 48/346 [00:00<00:01, 157.67it/s]
 18%|█▊        | 64/346 [00:00<00:01, 157.18it/s]
 23%|██▎       | 81/346 [00:00<00:01, 160.08it/s]
 29%|██▊       | 99/346 [00:00<00:01, 164.55it/s]
 34%|███▎      | 116/346 [00:00<00:01, 160.22it/s]
 38%|███▊      | 133/346 [00:00<00:01, 158.72it/s]
 43%|████▎     | 149/346 [00:00<00:01, 152.81it/s]
 48%|████▊     | 165/346 [00:01<00:01, 148.63it/s]
 52%|█████▏    | 180/346 [00:01<00:01, 143.98it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 143.08it/s]
 61%|██████    | 210/346 [00:01<00:00, 141.94it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 146.97it/s]
 70%|███████   | 243/346 [00:01<00:00, 151.72it/s]
 80%|████████  | 278/346 [00:01<00:00, 161.23it/s]
 86%|████████▌ | 296/346 [00:01<00:00, 163.90it/s]
 91%|█████████ | 314/346 [00:02<00:00, 166.13it/s]
 96%|█████████▌| 331/346 [00:02<00:00, 165.44it/s]
100%|██████████| 346/346 [00:02<00:00, 155.39it/s]
  0%|          | 0/99 [00:00<?, ?it/

[2m[36m(func pid=21900)[0m Epoch 00056: reducing learning rate of group 0 to 1.0280e-05.


  4%|▍         | 14/346 [00:00<00:02, 138.78it/s]
  8%|▊         | 28/346 [00:00<00:02, 137.08it/s]
 12%|█▏        | 43/346 [00:00<00:02, 137.94it/s]
 16%|█▋        | 57/346 [00:00<00:02, 138.27it/s]
 21%|██        | 72/346 [00:00<00:01, 140.94it/s]
 25%|██▌       | 87/346 [00:00<00:01, 138.92it/s]
 29%|██▉       | 101/346 [00:00<00:01, 138.83it/s]
 34%|███▎      | 116/346 [00:00<00:01, 141.30it/s]
 38%|███▊      | 131/346 [00:00<00:01, 141.32it/s]
 42%|████▏     | 147/346 [00:01<00:01, 144.03it/s]
 47%|████▋     | 163/346 [00:01<00:01, 147.86it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 148.44it/s]
 56%|█████▌    | 193/346 [00:01<00:01, 145.52it/s]
 60%|██████    | 208/346 [00:01<00:00, 146.32it/s]
 64%|██████▍   | 223/346 [00:01<00:00, 145.71it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 147.40it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 151.23it/s]
 83%|████████▎ | 288/346 [00:01<00:00, 156.36it/s]
 88%|████████▊ | 304/346 [00:02<00:00, 155.94it/s]
 93%|█████████▎| 321/346 [00:02<00:00

[2m[36m(func pid=21900)[0m Epoch 00062: reducing learning rate of group 0 to 5.1399e-06.


 10%|▉         | 33/346 [00:00<00:01, 164.26it/s]
 14%|█▍        | 50/346 [00:00<00:01, 158.10it/s]
 19%|█▉        | 66/346 [00:00<00:01, 157.74it/s]
 24%|██▍       | 83/346 [00:00<00:01, 161.51it/s]
 29%|██▉       | 100/346 [00:00<00:01, 161.64it/s]
 34%|███▍      | 117/346 [00:00<00:01, 158.10it/s]
 39%|███▊      | 134/346 [00:00<00:01, 158.97it/s]
 43%|████▎     | 150/346 [00:00<00:01, 159.23it/s]
 48%|████▊     | 166/346 [00:01<00:01, 153.52it/s]
 53%|█████▎    | 182/346 [00:01<00:01, 151.85it/s]
 57%|█████▋    | 198/346 [00:01<00:00, 149.77it/s]
 62%|██████▏   | 214/346 [00:01<00:00, 151.75it/s]
 66%|██████▋   | 230/346 [00:01<00:00, 150.81it/s]
 71%|███████▏  | 247/346 [00:01<00:00, 154.13it/s]
 76%|███████▌  | 263/346 [00:01<00:00, 154.91it/s]
 81%|████████  | 280/346 [00:01<00:00, 157.79it/s]
 86%|████████▌ | 297/346 [00:01<00:00, 158.35it/s]
 90%|█████████ | 313/346 [00:02<00:00, 156.09it/s]
 95%|█████████▌| 329/346 [00:02<00:00, 155.44it/s]
100%|██████████| 346/346 [00:02<00:

[2m[36m(func pid=21900)[0m Epoch 00068: reducing learning rate of group 0 to 2.5700e-06.


  9%|▉         | 32/346 [00:00<00:01, 157.64it/s]
 14%|█▍        | 48/346 [00:00<00:01, 158.15it/s]
 18%|█▊        | 64/346 [00:00<00:01, 156.38it/s]
 23%|██▎       | 81/346 [00:00<00:01, 160.05it/s]
 28%|██▊       | 98/346 [00:00<00:01, 159.68it/s]
 33%|███▎      | 114/346 [00:00<00:01, 158.69it/s]
 38%|███▊      | 130/346 [00:00<00:01, 159.08it/s]
 42%|████▏     | 147/346 [00:00<00:01, 162.01it/s]
 47%|████▋     | 164/346 [00:01<00:01, 162.90it/s]
 52%|█████▏    | 181/346 [00:01<00:01, 158.16it/s]
 57%|█████▋    | 197/346 [00:01<00:00, 153.98it/s]
 62%|██████▏   | 213/346 [00:01<00:00, 151.37it/s]
 66%|██████▌   | 229/346 [00:01<00:00, 149.03it/s]
 71%|███████   | 244/346 [00:01<00:00, 148.99it/s]
 75%|███████▌  | 260/346 [00:01<00:00, 151.78it/s]
 80%|███████▉  | 276/346 [00:01<00:00, 153.24it/s]
 84%|████████▍ | 292/346 [00:01<00:00, 153.05it/s]
 89%|████████▉ | 308/346 [00:01<00:00, 153.78it/s]
 94%|█████████▎| 324/346 [00:02<00:00, 152.70it/s]
  0%|          | 0/99 [00:00<?, ?it/

[2m[36m(func pid=21900)[0m Epoch 00074: reducing learning rate of group 0 to 1.2850e-06.


  9%|▉         | 32/346 [00:00<00:01, 158.30it/s]
 14%|█▍        | 48/346 [00:00<00:02, 142.48it/s]
 19%|█▉        | 65/346 [00:00<00:01, 151.44it/s]
 23%|██▎       | 81/346 [00:00<00:01, 154.20it/s]
 28%|██▊       | 97/346 [00:00<00:01, 153.26it/s]
 33%|███▎      | 113/346 [00:00<00:01, 153.88it/s]
 37%|███▋      | 129/346 [00:00<00:01, 154.71it/s]
 42%|████▏     | 146/346 [00:00<00:01, 156.46it/s]
 47%|████▋     | 162/346 [00:01<00:01, 153.82it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 152.97it/s]
 56%|█████▌    | 194/346 [00:01<00:00, 153.21it/s]
 61%|██████    | 210/346 [00:01<00:00, 151.15it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 149.88it/s]
 70%|██████▉   | 242/346 [00:01<00:00, 151.82it/s]
 75%|███████▍  | 258/346 [00:01<00:00, 153.37it/s]
 84%|████████▍ | 291/346 [00:01<00:00, 156.19it/s]
 89%|████████▉ | 308/346 [00:02<00:00, 158.43it/s]
 94%|█████████▍| 325/346 [00:02<00:00, 160.30it/s]
100%|██████████| 346/346 [00:02<00:00, 154.58it/s]
  0%|          | 0/346 [00:00<?, ?it

[2m[36m(func pid=21900)[0m Epoch 00080: reducing learning rate of group 0 to 6.4249e-07.


  5%|▍         | 16/346 [00:00<00:02, 156.57it/s]
 10%|▉         | 33/346 [00:00<00:01, 158.07it/s]
 14%|█▍        | 49/346 [00:00<00:01, 154.52it/s]
 19%|█▉        | 65/346 [00:00<00:01, 153.30it/s]
 23%|██▎       | 81/346 [00:00<00:01, 150.29it/s]
 28%|██▊       | 97/346 [00:00<00:01, 147.07it/s]
 32%|███▏      | 112/346 [00:00<00:01, 147.33it/s]
 37%|███▋      | 127/346 [00:00<00:01, 147.14it/s]
 41%|████▏     | 143/346 [00:00<00:01, 148.87it/s]
 46%|████▌     | 159/346 [00:01<00:01, 150.64it/s]
 51%|█████     | 175/346 [00:01<00:01, 152.65it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 152.69it/s]
 60%|██████    | 208/346 [00:01<00:00, 156.35it/s]
 65%|██████▍   | 224/346 [00:01<00:00, 152.80it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 155.70it/s]
 75%|███████▍  | 258/346 [00:01<00:00, 157.88it/s]
 79%|███████▉  | 275/346 [00:01<00:00, 160.15it/s]
 84%|████████▍ | 292/346 [00:01<00:00, 160.26it/s]
 89%|████████▉ | 309/346 [00:02<00:00, 159.24it/s]
 94%|█████████▍| 326/346 [00:02<00:00

[2m[36m(func pid=21900)[0m Epoch 00086: reducing learning rate of group 0 to 3.2125e-07.


  9%|▊         | 30/346 [00:00<00:02, 147.10it/s]
 13%|█▎        | 45/346 [00:00<00:02, 143.61it/s]
 17%|█▋        | 60/346 [00:00<00:01, 145.23it/s]
 22%|██▏       | 75/346 [00:00<00:01, 145.83it/s]
 26%|██▋       | 91/346 [00:00<00:01, 150.34it/s]
 36%|███▌      | 124/346 [00:00<00:01, 154.42it/s]
 41%|████      | 141/346 [00:00<00:01, 156.90it/s]
 45%|████▌     | 157/346 [00:01<00:01, 157.28it/s]
 50%|█████     | 174/346 [00:01<00:01, 159.67it/s]
 55%|█████▌    | 191/346 [00:01<00:00, 159.87it/s]
 60%|█████▉    | 207/346 [00:01<00:00, 158.55it/s]
 64%|██████▍   | 223/346 [00:01<00:00, 158.91it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 154.99it/s]
 74%|███████▍  | 256/346 [00:01<00:00, 157.20it/s]
 79%|███████▊  | 272/346 [00:01<00:00, 157.75it/s]
 84%|████████▎ | 289/346 [00:01<00:00, 159.34it/s]
 88%|████████▊ | 305/346 [00:01<00:00, 156.28it/s]
 93%|█████████▎| 322/346 [00:02<00:00, 158.61it/s]
100%|██████████| 346/346 [00:02<00:00, 155.52it/s]
  0%|          | 0/99 [00:00<?, ?it/

[2m[36m(func pid=21900)[0m Epoch 00092: reducing learning rate of group 0 to 1.6062e-07.


  5%|▍         | 16/346 [00:00<00:02, 153.72it/s]
  9%|▉         | 32/346 [00:00<00:02, 152.87it/s]
 19%|█▉        | 65/346 [00:00<00:01, 153.67it/s]
 23%|██▎       | 81/346 [00:00<00:01, 153.50it/s]
 28%|██▊       | 98/346 [00:00<00:01, 156.08it/s]
 33%|███▎      | 115/346 [00:00<00:01, 158.24it/s]
 38%|███▊      | 131/346 [00:00<00:01, 158.27it/s]
 43%|████▎     | 148/346 [00:00<00:01, 159.31it/s]
 47%|████▋     | 164/346 [00:01<00:01, 157.71it/s]
 52%|█████▏    | 181/346 [00:01<00:01, 159.37it/s]
 62%|██████▏   | 214/346 [00:01<00:00, 158.12it/s]
 67%|██████▋   | 231/346 [00:01<00:00, 158.79it/s]
 71%|███████▏  | 247/346 [00:01<00:00, 155.57it/s]
 76%|███████▌  | 263/346 [00:01<00:00, 152.85it/s]
 81%|████████  | 279/346 [00:01<00:00, 151.41it/s]
 85%|████████▌ | 295/346 [00:01<00:00, 150.65it/s]
 90%|████████▉ | 311/346 [00:02<00:00, 148.45it/s]
 94%|█████████▍| 326/346 [00:02<00:00, 147.13it/s]
100%|██████████| 346/346 [00:02<00:00, 153.37it/s]
  0%|          | 0/99 [00:00<?, ?it/

[2m[36m(func pid=21900)[0m Epoch 00098: reducing learning rate of group 0 to 8.0311e-08.


  5%|▌         | 18/346 [00:00<00:01, 173.21it/s]
 10%|█         | 36/346 [00:00<00:01, 168.79it/s]
 15%|█▌        | 53/346 [00:00<00:01, 165.13it/s]
 20%|██        | 70/346 [00:00<00:01, 164.55it/s]
 25%|██▌       | 87/346 [00:00<00:01, 160.81it/s]
 30%|███       | 105/346 [00:00<00:01, 163.50it/s]
 35%|███▌      | 122/346 [00:00<00:01, 161.71it/s]
 40%|████      | 139/346 [00:00<00:01, 159.72it/s]
 45%|████▍     | 155/346 [00:00<00:01, 159.11it/s]
 49%|████▉     | 171/346 [00:01<00:01, 153.41it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 148.66it/s]
 58%|█████▊    | 202/346 [00:01<00:00, 147.25it/s]
 63%|██████▎   | 217/346 [00:01<00:00, 144.39it/s]
 67%|██████▋   | 232/346 [00:01<00:00, 145.02it/s]
 72%|███████▏  | 249/346 [00:01<00:00, 151.45it/s]
 77%|███████▋  | 266/346 [00:01<00:00, 155.02it/s]
 82%|████████▏ | 283/346 [00:01<00:00, 156.99it/s]
 87%|████████▋ | 300/346 [00:01<00:00, 160.38it/s]
 92%|█████████▏| 317/346 [00:02<00:00, 160.44it/s]
 97%|█████████▋| 334/346 [00:02<00:0

[2m[36m(func pid=21900)[0m Epoch 00104: reducing learning rate of group 0 to 4.0156e-08.


  9%|▉         | 31/346 [00:00<00:02, 152.70it/s]
 14%|█▎        | 47/346 [00:00<00:02, 149.40it/s]
 18%|█▊        | 62/346 [00:00<00:01, 145.94it/s]
 22%|██▏       | 77/346 [00:00<00:01, 145.03it/s]
 31%|███       | 107/346 [00:00<00:01, 144.55it/s]
 35%|███▌      | 122/346 [00:00<00:01, 144.97it/s]
 40%|████      | 139/346 [00:00<00:01, 149.92it/s]
 45%|████▍     | 155/346 [00:01<00:01, 151.89it/s]
 50%|████▉     | 172/346 [00:01<00:01, 154.63it/s]
 55%|█████▍    | 189/346 [00:01<00:00, 157.05it/s]
 59%|█████▉    | 205/346 [00:01<00:00, 156.36it/s]
 64%|██████▍   | 222/346 [00:01<00:00, 157.32it/s]
 69%|██████▉   | 238/346 [00:01<00:00, 157.20it/s]
 74%|███████▎  | 255/346 [00:01<00:00, 159.34it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 159.20it/s]
 83%|████████▎ | 287/346 [00:01<00:00, 157.82it/s]
 88%|████████▊ | 303/346 [00:01<00:00, 148.39it/s]
 92%|█████████▏| 320/346 [00:02<00:00, 151.89it/s]
  0%|          | 0/99 [00:00<?, ?it/s]
100%|██████████| 99/99 [00:00<00:00, 622.19it/s

[2m[36m(func pid=21900)[0m Epoch 00110: reducing learning rate of group 0 to 2.0078e-08.


  9%|▉         | 32/346 [00:00<00:02, 153.98it/s]
 14%|█▍        | 48/346 [00:00<00:02, 148.99it/s]
 18%|█▊        | 63/346 [00:00<00:01, 146.05it/s]
 23%|██▎       | 78/346 [00:00<00:01, 146.24it/s]
 27%|██▋       | 93/346 [00:00<00:01, 145.43it/s]
 32%|███▏      | 109/346 [00:00<00:01, 148.71it/s]
 36%|███▋      | 126/346 [00:00<00:01, 152.68it/s]
 41%|████      | 142/346 [00:00<00:01, 141.68it/s]
 46%|████▌     | 158/346 [00:01<00:01, 144.44it/s]
 50%|█████     | 173/346 [00:01<00:01, 144.02it/s]
 55%|█████▍    | 189/346 [00:01<00:01, 147.39it/s]
 60%|█████▉    | 206/346 [00:01<00:00, 152.06it/s]
 64%|██████▍   | 222/346 [00:01<00:00, 153.12it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 156.18it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 155.60it/s]
 83%|████████▎ | 287/346 [00:01<00:00, 154.58it/s]
 88%|████████▊ | 303/346 [00:02<00:00, 154.01it/s]
 92%|█████████▏| 319/346 [00:02<00:00, 154.73it/s]
 97%|█████████▋| 335/346 [00:02<00:00, 149.44it/s]
 62%|██████▏   | 61/99 [00:00<00:00,

[2m[36m(func pid=21900)[0m Epoch 00116: reducing learning rate of group 0 to 1.0039e-08.


  5%|▍         | 17/346 [00:00<00:01, 165.31it/s]
 10%|▉         | 34/346 [00:00<00:01, 156.72it/s]
 20%|█▉        | 68/346 [00:00<00:01, 159.97it/s]
 25%|██▍       | 85/346 [00:00<00:01, 159.50it/s]
 29%|██▉       | 102/346 [00:00<00:01, 161.36it/s]
 34%|███▍      | 119/346 [00:00<00:01, 159.08it/s]
 39%|███▉      | 135/346 [00:00<00:01, 158.73it/s]
 44%|████▍     | 152/346 [00:00<00:01, 159.92it/s]
 49%|████▊     | 168/346 [00:01<00:01, 157.96it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 159.21it/s]
 63%|██████▎   | 219/346 [00:01<00:00, 161.02it/s]
 68%|██████▊   | 236/346 [00:01<00:00, 160.42it/s]
 73%|███████▎  | 253/346 [00:01<00:00, 158.59it/s]
 78%|███████▊  | 269/346 [00:01<00:00, 154.76it/s]
 82%|████████▏ | 285/346 [00:01<00:00, 151.14it/s]
 87%|████████▋ | 301/346 [00:01<00:00, 149.88it/s]
 92%|█████████▏| 317/346 [00:02<00:00, 147.53it/s]
 96%|█████████▌| 332/346 [00:02<00:00, 147.74it/s]
 64%|██████▎   | 63/99 [00:00<00:00, 616.10it/s]
100%|██████████| 99/99 [00:00<00:00, 

[2m[36m(func pid=3900)[0m Epoch 00033: reducing learning rate of group 0 to 4.1727e-04.


  4%|▍         | 15/346 [00:00<00:02, 141.40it/s]
  9%|▊         | 30/346 [00:00<00:02, 140.31it/s]
 13%|█▎        | 45/346 [00:00<00:02, 140.78it/s]
 17%|█▋        | 60/346 [00:00<00:02, 142.25it/s]
 22%|██▏       | 75/346 [00:00<00:01, 141.72it/s]
 26%|██▌       | 90/346 [00:00<00:01, 142.48it/s]
 30%|███       | 105/346 [00:00<00:01, 143.74it/s]
 35%|███▍      | 120/346 [00:00<00:01, 139.33it/s]
 39%|███▊      | 134/346 [00:00<00:01, 137.17it/s]
 43%|████▎     | 148/346 [00:01<00:01, 137.85it/s]
 47%|████▋     | 162/346 [00:01<00:01, 136.34it/s]
 51%|█████     | 176/346 [00:01<00:01, 130.76it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 131.19it/s]
 59%|█████▉    | 204/346 [00:01<00:01, 131.40it/s]
 63%|██████▎   | 218/346 [00:01<00:00, 131.67it/s]
 67%|██████▋   | 232/346 [00:01<00:00, 133.32it/s]
 71%|███████   | 246/346 [00:01<00:00, 132.01it/s]
 75%|███████▌  | 260/346 [00:01<00:00, 132.15it/s]
 79%|███████▉  | 274/346 [00:02<00:00, 133.62it/s]
 83%|████████▎ | 288/346 [00:02<00:00

[2m[36m(func pid=3900)[0m Epoch 00048: reducing learning rate of group 0 to 2.0863e-04.


  9%|▊         | 30/346 [00:00<00:02, 137.94it/s]
 13%|█▎        | 44/346 [00:00<00:02, 136.05it/s]
 17%|█▋        | 58/346 [00:00<00:02, 126.55it/s]
 21%|██        | 73/346 [00:00<00:02, 132.43it/s]
 25%|██▌       | 87/346 [00:00<00:01, 133.27it/s]
 29%|██▉       | 101/346 [00:00<00:01, 132.89it/s]
 33%|███▎      | 115/346 [00:00<00:01, 134.21it/s]
 38%|███▊      | 130/346 [00:00<00:01, 136.21it/s]
 42%|████▏     | 145/346 [00:01<00:01, 137.41it/s]
 46%|████▌     | 159/346 [00:01<00:01, 137.19it/s]
 50%|█████     | 173/346 [00:01<00:01, 136.64it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 138.03it/s]
 59%|█████▊    | 203/346 [00:01<00:01, 141.47it/s]
 67%|██████▋   | 233/346 [00:01<00:00, 143.08it/s]
 72%|███████▏  | 248/346 [00:01<00:00, 140.25it/s]
 76%|███████▌  | 263/346 [00:01<00:00, 140.93it/s]
 80%|████████  | 278/346 [00:02<00:00, 139.90it/s]
 85%|████████▍ | 293/346 [00:02<00:00, 141.38it/s]
 89%|████████▉ | 308/346 [00:02<00:00, 140.61it/s]
 93%|█████████▎| 323/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00060: reducing learning rate of group 0 to 1.0432e-04.


  4%|▍         | 15/346 [00:00<00:02, 143.87it/s]
  9%|▊         | 30/346 [00:00<00:02, 108.53it/s]
 12%|█▏        | 43/346 [00:00<00:02, 115.88it/s]
 16%|█▌        | 56/346 [00:00<00:02, 118.37it/s]
 20%|█▉        | 69/346 [00:00<00:02, 121.80it/s]
 24%|██▍       | 83/346 [00:00<00:02, 124.92it/s]
 28%|██▊       | 98/346 [00:00<00:01, 132.19it/s]
 33%|███▎      | 114/346 [00:00<00:01, 137.79it/s]
 38%|███▊      | 130/346 [00:00<00:01, 142.14it/s]
 42%|████▏     | 146/346 [00:01<00:01, 145.27it/s]
 47%|████▋     | 162/346 [00:01<00:01, 148.32it/s]
 51%|█████     | 177/346 [00:01<00:01, 146.88it/s]
 55%|█████▌    | 192/346 [00:01<00:01, 145.82it/s]
 60%|█████▉    | 207/346 [00:01<00:01, 138.95it/s]
 64%|██████▍   | 221/346 [00:01<00:00, 135.95it/s]
 68%|██████▊   | 235/346 [00:01<00:00, 134.95it/s]
 72%|███████▏  | 250/346 [00:01<00:00, 137.32it/s]
 77%|███████▋  | 266/346 [00:01<00:00, 142.21it/s]
 82%|████████▏ | 282/346 [00:02<00:00, 145.65it/s]
 86%|████████▌ | 297/346 [00:02<00:00,

[2m[36m(func pid=3900)[0m Epoch 00066: reducing learning rate of group 0 to 5.2158e-05.


  9%|▊         | 30/346 [00:00<00:02, 146.60it/s]
 13%|█▎        | 45/346 [00:00<00:02, 124.62it/s]
 17%|█▋        | 58/346 [00:00<00:02, 126.42it/s]
 21%|██        | 71/346 [00:00<00:02, 119.09it/s]
 24%|██▍       | 84/346 [00:00<00:02, 116.74it/s]
 28%|██▊       | 97/346 [00:00<00:02, 119.76it/s]
 32%|███▏      | 110/346 [00:00<00:01, 119.50it/s]
 36%|███▌      | 123/346 [00:01<00:01, 120.15it/s]
 39%|███▉      | 136/346 [00:01<00:01, 119.22it/s]
 43%|████▎     | 148/346 [00:01<00:01, 118.75it/s]
 47%|████▋     | 161/346 [00:01<00:01, 120.30it/s]
 50%|█████     | 174/346 [00:01<00:01, 119.66it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 122.16it/s]
 58%|█████▊    | 200/346 [00:01<00:01, 123.10it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 123.45it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 122.80it/s]
 73%|███████▎  | 252/346 [00:02<00:00, 122.58it/s]
 77%|███████▋  | 265/346 [00:02<00:00, 123.85it/s]
 80%|████████  | 278/346 [00:02<00:00, 121.05it/s]
 84%|████████▍ | 291/346 [00:02<00:00

[2m[36m(func pid=3900)[0m Epoch 00087: reducing learning rate of group 0 to 2.6079e-05.


  3%|▎         | 12/346 [00:00<00:02, 115.52it/s]
  7%|▋         | 25/346 [00:00<00:02, 120.09it/s]
 11%|█         | 38/346 [00:00<00:02, 119.06it/s]
 15%|█▍        | 51/346 [00:00<00:02, 120.04it/s]
 18%|█▊        | 64/346 [00:00<00:02, 117.75it/s]
 22%|██▏       | 77/346 [00:00<00:02, 119.81it/s]
 26%|██▌       | 90/346 [00:00<00:02, 122.47it/s]
 30%|███       | 104/346 [00:00<00:01, 126.68it/s]
 34%|███▍      | 117/346 [00:00<00:01, 124.24it/s]
 38%|███▊      | 130/346 [00:01<00:01, 123.80it/s]
 45%|████▌     | 156/346 [00:01<00:01, 124.71it/s]
 49%|████▉     | 169/346 [00:01<00:01, 125.81it/s]
 53%|█████▎    | 182/346 [00:01<00:01, 122.68it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 121.95it/s]
 60%|██████    | 208/346 [00:01<00:01, 120.57it/s]
 64%|██████▍   | 221/346 [00:01<00:01, 117.78it/s]
 68%|██████▊   | 234/346 [00:01<00:00, 118.90it/s]
 71%|███████▏  | 247/346 [00:02<00:00, 119.43it/s]
 75%|███████▌  | 260/346 [00:02<00:00, 122.36it/s]
 79%|███████▉  | 273/346 [00:02<00:00,

[2m[36m(func pid=3900)[0m Epoch 00100: reducing learning rate of group 0 to 1.3040e-05.


  8%|▊         | 28/346 [00:00<00:02, 133.62it/s]
 12%|█▏        | 42/346 [00:00<00:02, 134.70it/s]
 16%|█▋        | 57/346 [00:00<00:02, 136.76it/s]
 21%|██        | 72/346 [00:00<00:01, 140.50it/s]
 25%|██▌       | 87/346 [00:00<00:01, 143.61it/s]
 34%|███▍      | 119/346 [00:00<00:01, 148.34it/s]
 39%|███▊      | 134/346 [00:00<00:01, 147.59it/s]
 43%|████▎     | 149/346 [00:01<00:01, 144.01it/s]
 47%|████▋     | 164/346 [00:01<00:01, 143.24it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 141.47it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 145.59it/s]
 61%|██████    | 210/346 [00:01<00:00, 145.57it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 147.96it/s]
 74%|███████▍  | 257/346 [00:01<00:00, 147.32it/s]
 79%|███████▉  | 273/346 [00:01<00:00, 148.55it/s]
 83%|████████▎ | 288/346 [00:01<00:00, 147.77it/s]
 88%|████████▊ | 303/346 [00:02<00:00, 145.23it/s]
 92%|█████████▏| 318/346 [00:02<00:00, 142.70it/s]
 96%|█████████▌| 333/346 [00:02<00:00, 141.15it/s]
100%|██████████| 346/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00106: reducing learning rate of group 0 to 6.5198e-06.


  4%|▍         | 15/346 [00:00<00:02, 145.44it/s]
  9%|▊         | 30/346 [00:00<00:02, 145.59it/s]
 13%|█▎        | 45/346 [00:00<00:02, 144.83it/s]
 22%|██▏       | 75/346 [00:00<00:01, 144.12it/s]
 26%|██▌       | 90/346 [00:00<00:01, 143.98it/s]
 30%|███       | 105/346 [00:00<00:01, 144.57it/s]
 35%|███▍      | 120/346 [00:00<00:01, 144.03it/s]
 39%|███▉      | 136/346 [00:00<00:01, 146.22it/s]
 44%|████▎     | 151/346 [00:01<00:01, 146.16it/s]
 48%|████▊     | 166/346 [00:01<00:01, 145.44it/s]
 52%|█████▏    | 181/346 [00:01<00:01, 141.82it/s]
 57%|█████▋    | 196/346 [00:01<00:01, 142.16it/s]
 61%|██████    | 211/346 [00:01<00:00, 141.88it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 135.30it/s]
 69%|██████▉   | 240/346 [00:01<00:00, 135.02it/s]
 74%|███████▎  | 255/346 [00:01<00:00, 138.18it/s]
 78%|███████▊  | 270/346 [00:01<00:00, 140.86it/s]
 83%|████████▎ | 286/346 [00:02<00:00, 143.77it/s]
 87%|████████▋ | 301/346 [00:02<00:00, 144.72it/s]
 91%|█████████▏| 316/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00118: reducing learning rate of group 0 to 3.2599e-06.


  4%|▍         | 15/346 [00:00<00:02, 145.26it/s]
  9%|▊         | 30/346 [00:00<00:02, 141.53it/s]
 17%|█▋        | 60/346 [00:00<00:01, 145.73it/s]
 22%|██▏       | 75/346 [00:00<00:01, 144.87it/s]
 26%|██▌       | 90/346 [00:00<00:01, 137.40it/s]
 30%|███       | 104/346 [00:00<00:01, 136.83it/s]
 34%|███▍      | 118/346 [00:00<00:01, 126.04it/s]
 38%|███▊      | 132/346 [00:00<00:01, 128.13it/s]
 42%|████▏     | 146/346 [00:01<00:01, 129.76it/s]
 46%|████▌     | 160/346 [00:01<00:01, 132.18it/s]
 50%|█████     | 174/346 [00:01<00:01, 134.32it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 134.72it/s]
 59%|█████▊    | 203/346 [00:01<00:01, 136.31it/s]
 63%|██████▎   | 217/346 [00:01<00:00, 135.05it/s]
 67%|██████▋   | 231/346 [00:01<00:00, 133.41it/s]
 71%|███████   | 245/346 [00:01<00:00, 132.44it/s]
 75%|███████▍  | 259/346 [00:01<00:00, 129.27it/s]
 79%|███████▊  | 272/346 [00:02<00:00, 125.04it/s]
 83%|████████▎ | 286/346 [00:02<00:00, 127.27it/s]
 87%|████████▋ | 300/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00124: reducing learning rate of group 0 to 1.6300e-06.


  4%|▍         | 14/346 [00:00<00:02, 138.42it/s]
  8%|▊         | 28/346 [00:00<00:02, 135.19it/s]
 12%|█▏        | 42/346 [00:00<00:02, 136.14it/s]
 21%|██        | 72/346 [00:00<00:01, 142.24it/s]
 25%|██▌       | 87/346 [00:00<00:01, 142.44it/s]
 29%|██▉       | 102/346 [00:00<00:01, 140.88it/s]
 34%|███▍      | 117/346 [00:00<00:01, 142.40it/s]
 38%|███▊      | 132/346 [00:00<00:01, 143.00it/s]
 43%|████▎     | 148/346 [00:01<00:01, 145.63it/s]
 47%|████▋     | 163/346 [00:01<00:01, 145.37it/s]
 56%|█████▌    | 193/346 [00:01<00:01, 145.74it/s]
 60%|██████    | 208/346 [00:01<00:00, 146.32it/s]
 64%|██████▍   | 223/346 [00:01<00:00, 146.57it/s]
 69%|██████▉   | 238/346 [00:01<00:00, 145.98it/s]
 73%|███████▎  | 253/346 [00:01<00:00, 143.46it/s]
 77%|███████▋  | 268/346 [00:01<00:00, 143.58it/s]
 82%|████████▏ | 283/346 [00:01<00:00, 140.62it/s]
 86%|████████▌ | 298/346 [00:02<00:00, 141.95it/s]
 90%|█████████ | 313/346 [00:02<00:00, 139.50it/s]
100%|██████████| 346/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00137: reducing learning rate of group 0 to 8.1498e-07.


  4%|▍         | 14/346 [00:00<00:02, 139.93it/s]
 12%|█▏        | 43/346 [00:00<00:02, 142.50it/s]
 17%|█▋        | 58/346 [00:00<00:02, 142.54it/s]
 21%|██        | 73/346 [00:00<00:01, 141.71it/s]
 25%|██▌       | 88/346 [00:00<00:01, 143.97it/s]
 30%|██▉       | 103/346 [00:00<00:01, 144.42it/s]
 34%|███▍      | 118/346 [00:00<00:01, 143.64it/s]
 38%|███▊      | 133/346 [00:00<00:01, 144.70it/s]
 43%|████▎     | 149/346 [00:01<00:01, 146.74it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 144.74it/s]
 56%|█████▌    | 194/346 [00:01<00:01, 144.15it/s]
 60%|██████    | 209/346 [00:01<00:00, 140.96it/s]
 65%|██████▍   | 224/346 [00:01<00:00, 139.36it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 140.91it/s]
 73%|███████▎  | 254/346 [00:01<00:00, 141.15it/s]
 78%|███████▊  | 269/346 [00:01<00:00, 140.86it/s]
 82%|████████▏ | 284/346 [00:01<00:00, 142.97it/s]
 86%|████████▋ | 299/346 [00:02<00:00, 143.50it/s]
 95%|█████████▌| 329/346 [00:02<00:00, 143.48it/s]
  0%|          | 0/99 [00:00<?, ?it/

[2m[36m(func pid=3900)[0m Epoch 00143: reducing learning rate of group 0 to 4.0749e-07.


  8%|▊         | 29/346 [00:00<00:02, 145.36it/s]
 13%|█▎        | 44/346 [00:00<00:02, 144.85it/s]
 17%|█▋        | 59/346 [00:00<00:01, 146.79it/s]
 21%|██▏       | 74/346 [00:00<00:01, 147.47it/s]
 26%|██▌       | 89/346 [00:00<00:01, 146.90it/s]
 30%|███       | 104/346 [00:00<00:01, 144.35it/s]
 34%|███▍      | 119/346 [00:00<00:01, 145.02it/s]
 43%|████▎     | 150/346 [00:01<00:01, 147.15it/s]
 48%|████▊     | 165/346 [00:01<00:01, 148.00it/s]
 52%|█████▏    | 180/346 [00:01<00:01, 145.55it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 145.60it/s]
 61%|██████    | 211/346 [00:01<00:00, 147.67it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 145.77it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 144.79it/s]
 74%|███████▍  | 256/346 [00:01<00:00, 144.32it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 144.11it/s]
 83%|████████▎ | 286/346 [00:01<00:00, 145.11it/s]
 87%|████████▋ | 301/346 [00:02<00:00, 143.57it/s]
 92%|█████████▏| 317/346 [00:02<00:00, 146.28it/s]
 96%|█████████▌| 332/346 [00:02<00:0

[2m[36m(func pid=3900)[0m Epoch 00149: reducing learning rate of group 0 to 2.0374e-07.


  4%|▍         | 14/346 [00:00<00:02, 135.49it/s]
  8%|▊         | 28/346 [00:00<00:02, 135.92it/s]
 12%|█▏        | 42/346 [00:00<00:02, 137.14it/s]
 16%|█▋        | 57/346 [00:00<00:02, 141.65it/s]
 21%|██        | 73/346 [00:00<00:01, 145.53it/s]
 25%|██▌       | 88/346 [00:00<00:01, 146.62it/s]
 30%|██▉       | 103/346 [00:00<00:01, 146.71it/s]
 34%|███▍      | 118/346 [00:00<00:01, 146.30it/s]
 38%|███▊      | 133/346 [00:00<00:01, 145.27it/s]
 43%|████▎     | 148/346 [00:01<00:01, 144.04it/s]
 47%|████▋     | 163/346 [00:01<00:01, 144.21it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 145.49it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 147.88it/s]
 61%|██████    | 210/346 [00:01<00:00, 148.49it/s]
 65%|██████▌   | 226/346 [00:01<00:00, 150.77it/s]
 70%|██████▉   | 242/346 [00:01<00:00, 148.43it/s]
 75%|███████▍  | 258/346 [00:01<00:00, 149.65it/s]
 79%|███████▉  | 273/346 [00:01<00:00, 149.25it/s]
 84%|████████▎ | 289/346 [00:01<00:00, 150.12it/s]
 88%|████████▊ | 305/346 [00:02<00:00

[2m[36m(func pid=23240)[0m Epoch 00026: reducing learning rate of group 0 to 3.8013e-04.


  3%|▎         | 11/346 [00:00<00:03, 108.17it/s]
  7%|▋         | 23/346 [00:00<00:02, 111.89it/s]
 10%|█         | 35/346 [00:00<00:03, 102.13it/s]
 13%|█▎        | 46/346 [00:00<00:02, 104.32it/s]
 17%|█▋        | 58/346 [00:00<00:02, 107.36it/s]
 20%|██        | 70/346 [00:00<00:02, 109.04it/s]
 24%|██▎       | 82/346 [00:00<00:02, 110.39it/s]
 27%|██▋       | 94/346 [00:00<00:02, 109.57it/s]
 31%|███       | 106/346 [00:00<00:02, 110.31it/s]
 34%|███▍      | 118/346 [00:01<00:02, 110.95it/s]
 38%|███▊      | 130/346 [00:01<00:01, 112.02it/s]
 41%|████      | 142/346 [00:01<00:01, 112.82it/s]
 45%|████▍     | 154/346 [00:01<00:01, 112.80it/s]
 48%|████▊     | 166/346 [00:01<00:01, 113.23it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 113.32it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 113.02it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 112.32it/s]
 62%|██████▏   | 214/346 [00:01<00:01, 112.61it/s]
 65%|██████▌   | 226/346 [00:02<00:01, 111.54it/s]
 69%|██████▉   | 238/346 [00:02<00:00, 

[2m[36m(func pid=23240)[0m Epoch 00033: reducing learning rate of group 0 to 1.9006e-04.


  3%|▎         | 12/346 [00:00<00:02, 117.79it/s]
  7%|▋         | 24/346 [00:00<00:02, 117.69it/s]
 10%|█         | 36/346 [00:00<00:02, 118.11it/s]
 14%|█▍        | 48/346 [00:00<00:02, 116.92it/s]
 17%|█▋        | 60/346 [00:00<00:02, 116.08it/s]
 21%|██        | 73/346 [00:00<00:02, 118.64it/s]
 25%|██▍       | 85/346 [00:00<00:02, 118.84it/s]
 28%|██▊       | 98/346 [00:00<00:02, 120.42it/s]
 32%|███▏      | 111/346 [00:00<00:01, 119.72it/s]
 36%|███▌      | 124/346 [00:01<00:01, 120.33it/s]
 40%|███▉      | 137/346 [00:01<00:01, 119.63it/s]
 43%|████▎     | 150/346 [00:01<00:01, 120.54it/s]
 47%|████▋     | 163/346 [00:01<00:01, 122.94it/s]
 51%|█████     | 176/346 [00:01<00:01, 122.86it/s]
 55%|█████▍    | 189/346 [00:01<00:01, 123.83it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 123.07it/s]
 62%|██████▏   | 215/346 [00:01<00:01, 124.37it/s]
 66%|██████▌   | 228/346 [00:01<00:00, 123.02it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 120.31it/s]
 73%|███████▎  | 254/346 [00:02<00:00, 

[2m[36m(func pid=23240)[0m Epoch 00050: reducing learning rate of group 0 to 9.5032e-05.


  3%|▎         | 12/346 [00:00<00:02, 119.51it/s]
  7%|▋         | 24/346 [00:00<00:02, 112.80it/s]
 11%|█         | 37/346 [00:00<00:02, 116.84it/s]
 14%|█▍        | 50/346 [00:00<00:02, 120.03it/s]
 18%|█▊        | 63/346 [00:00<00:02, 120.35it/s]
 25%|██▌       | 88/346 [00:00<00:02, 115.06it/s]
 29%|██▉       | 100/346 [00:00<00:02, 114.84it/s]
 32%|███▏      | 112/346 [00:00<00:02, 115.75it/s]
 36%|███▌      | 124/346 [00:01<00:01, 116.23it/s]
 39%|███▉      | 136/346 [00:01<00:01, 113.69it/s]
 43%|████▎     | 148/346 [00:01<00:01, 113.63it/s]
 46%|████▌     | 160/346 [00:01<00:01, 112.79it/s]
 50%|████▉     | 172/346 [00:01<00:01, 114.22it/s]
 53%|█████▎    | 184/346 [00:01<00:01, 114.55it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 117.37it/s]
 60%|██████    | 209/346 [00:01<00:01, 114.75it/s]
 64%|██████▍   | 221/346 [00:01<00:01, 111.16it/s]
 67%|██████▋   | 233/346 [00:02<00:01, 109.33it/s]
 71%|███████   | 245/346 [00:02<00:00, 110.45it/s]
 74%|███████▍  | 257/346 [00:02<00:00

[2m[36m(func pid=23240)[0m Epoch 00056: reducing learning rate of group 0 to 4.7516e-05.


  3%|▎         | 12/346 [00:00<00:02, 118.83it/s]
  7%|▋         | 25/346 [00:00<00:02, 123.33it/s]
 11%|█         | 38/346 [00:00<00:02, 123.02it/s]
 15%|█▍        | 51/346 [00:00<00:02, 123.22it/s]
 18%|█▊        | 64/346 [00:00<00:02, 123.89it/s]
 22%|██▏       | 77/346 [00:00<00:02, 123.40it/s]
 26%|██▌       | 90/346 [00:00<00:02, 122.08it/s]
 30%|██▉       | 103/346 [00:00<00:02, 121.15it/s]
 34%|███▎      | 116/346 [00:00<00:01, 119.45it/s]
 37%|███▋      | 128/346 [00:01<00:01, 119.37it/s]
 41%|████      | 141/346 [00:01<00:01, 120.66it/s]
 45%|████▍     | 154/346 [00:01<00:01, 121.67it/s]
 48%|████▊     | 167/346 [00:01<00:01, 122.63it/s]
 52%|█████▏    | 180/346 [00:01<00:01, 122.20it/s]
 56%|█████▌    | 193/346 [00:01<00:01, 121.63it/s]
 60%|█████▉    | 206/346 [00:01<00:01, 122.70it/s]
 63%|██████▎   | 219/346 [00:01<00:01, 123.03it/s]
 67%|██████▋   | 232/346 [00:01<00:00, 123.56it/s]
 71%|███████   | 245/346 [00:02<00:00, 123.75it/s]
 75%|███████▍  | 258/346 [00:02<00:00,

[2m[36m(func pid=23240)[0m Epoch 00062: reducing learning rate of group 0 to 2.3758e-05.


  0%|          | 0/346 [00:00<?, ?it/s]
  4%|▍         | 13/346 [00:00<00:02, 123.62it/s]
  8%|▊         | 26/346 [00:00<00:02, 123.17it/s]
 11%|█▏        | 39/346 [00:00<00:02, 122.77it/s]
 15%|█▌        | 53/346 [00:00<00:02, 125.68it/s]
 19%|█▉        | 66/346 [00:00<00:02, 119.11it/s]
 26%|██▌       | 90/346 [00:00<00:02, 115.50it/s]
 29%|██▉       | 102/346 [00:00<00:02, 112.52it/s]
 33%|███▎      | 114/346 [00:00<00:02, 113.08it/s]
 37%|███▋      | 127/346 [00:01<00:01, 117.95it/s]
 41%|████      | 141/346 [00:01<00:01, 122.21it/s]
 45%|████▍     | 154/346 [00:01<00:01, 122.09it/s]
 48%|████▊     | 167/346 [00:01<00:01, 118.45it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 116.99it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 117.76it/s]
 59%|█████▉    | 204/346 [00:01<00:01, 119.30it/s]
 63%|██████▎   | 217/346 [00:01<00:01, 121.44it/s]
 66%|██████▋   | 230/346 [00:01<00:00, 123.82it/s]
 70%|███████   | 243/346 [00:02<00:00, 125.57it/s]
 74%|███████▍  | 256/346 [00:02<00:00, 125.43it/

[2m[36m(func pid=23240)[0m Epoch 00071: reducing learning rate of group 0 to 1.1879e-05.


  8%|▊         | 26/346 [00:00<00:02, 122.18it/s]
 11%|█▏        | 39/346 [00:00<00:02, 118.36it/s]
 15%|█▌        | 52/346 [00:00<00:02, 119.57it/s]
 18%|█▊        | 64/346 [00:00<00:02, 112.00it/s]
 22%|██▏       | 76/346 [00:00<00:02, 110.07it/s]
 25%|██▌       | 88/346 [00:00<00:02, 111.35it/s]
 29%|██▉       | 100/346 [00:00<00:02, 110.30it/s]
 32%|███▏      | 112/346 [00:00<00:02, 110.18it/s]
 36%|███▌      | 124/346 [00:01<00:01, 111.21it/s]
 39%|███▉      | 136/346 [00:01<00:02, 104.95it/s]
 42%|████▏     | 147/346 [00:01<00:01, 101.89it/s]
 46%|████▌     | 158/346 [00:01<00:01, 96.87it/s] 
 49%|████▊     | 168/346 [00:01<00:01, 96.47it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 97.18it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 102.52it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 106.65it/s]
 62%|██████▏   | 213/346 [00:01<00:01, 104.98it/s]
 65%|██████▌   | 225/346 [00:02<00:01, 108.35it/s]
 68%|██████▊   | 237/346 [00:02<00:00, 109.24it/s]
 72%|███████▏  | 248/346 [00:02<00:00, 

[2m[36m(func pid=23240)[0m Epoch 00077: reducing learning rate of group 0 to 5.9395e-06.


  6%|▋         | 22/346 [00:00<00:03, 101.38it/s]
 10%|▉         | 33/346 [00:00<00:02, 105.13it/s]
 13%|█▎        | 45/346 [00:00<00:02, 108.71it/s]
 16%|█▌        | 56/346 [00:00<00:02, 107.29it/s]
 19%|█▉        | 67/346 [00:00<00:02, 104.11it/s]
 23%|██▎       | 79/346 [00:00<00:02, 105.44it/s]
 26%|██▌       | 90/346 [00:00<00:02, 101.85it/s]
 29%|██▉       | 101/346 [00:00<00:02, 100.77it/s]
 33%|███▎      | 113/346 [00:01<00:02, 104.79it/s]
 36%|███▌      | 124/346 [00:01<00:02, 103.02it/s]
 39%|███▉      | 136/346 [00:01<00:01, 106.87it/s]
 42%|████▏     | 147/346 [00:01<00:01, 104.87it/s]
 46%|████▌     | 158/346 [00:01<00:01, 103.60it/s]
 49%|████▉     | 170/346 [00:01<00:01, 106.12it/s]
 52%|█████▏    | 181/346 [00:01<00:01, 105.49it/s]
 55%|█████▌    | 192/346 [00:01<00:01, 106.35it/s]
 59%|█████▉    | 205/346 [00:01<00:01, 111.42it/s]
 63%|██████▎   | 218/346 [00:02<00:01, 115.11it/s]
 67%|██████▋   | 231/346 [00:02<00:00, 117.97it/s]
 71%|███████   | 244/346 [00:02<00:00,

[2m[36m(func pid=23240)[0m Epoch 00092: reducing learning rate of group 0 to 2.9697e-06.


  3%|▎         | 11/346 [00:00<00:03, 105.57it/s]
  7%|▋         | 23/346 [00:00<00:02, 108.74it/s]
 10%|▉         | 34/346 [00:00<00:02, 109.03it/s]
 13%|█▎        | 46/346 [00:00<00:02, 110.66it/s]
 17%|█▋        | 58/346 [00:00<00:02, 109.39it/s]
 24%|██▎       | 82/346 [00:00<00:02, 113.04it/s]
 27%|██▋       | 94/346 [00:00<00:02, 112.53it/s]
 31%|███       | 106/346 [00:00<00:02, 111.64it/s]
 34%|███▍      | 118/346 [00:01<00:02, 110.86it/s]
 38%|███▊      | 130/346 [00:01<00:01, 108.48it/s]
 41%|████      | 142/346 [00:01<00:01, 109.95it/s]
 45%|████▍     | 154/346 [00:01<00:01, 112.43it/s]
 48%|████▊     | 166/346 [00:01<00:01, 114.33it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 113.36it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 114.60it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 115.34it/s]
 62%|██████▏   | 215/346 [00:01<00:01, 117.97it/s]
 66%|██████▌   | 227/346 [00:02<00:01, 117.27it/s]
 69%|██████▉   | 239/346 [00:02<00:00, 117.05it/s]
 73%|███████▎  | 251/346 [00:02<00:00,

[2m[36m(func pid=23240)[0m Epoch 00104: reducing learning rate of group 0 to 1.4849e-06.


  3%|▎         | 11/346 [00:00<00:03, 106.74it/s]
  6%|▋         | 22/346 [00:00<00:03, 107.32it/s]
 10%|▉         | 33/346 [00:00<00:02, 106.69it/s]
 13%|█▎        | 44/346 [00:00<00:02, 106.69it/s]
 16%|█▌        | 55/346 [00:00<00:02, 101.07it/s]
 19%|█▉        | 66/346 [00:00<00:02, 98.19it/s] 
 22%|██▏       | 76/346 [00:00<00:02, 94.81it/s]
 25%|██▍       | 86/346 [00:00<00:02, 95.25it/s]
 28%|██▊       | 97/346 [00:00<00:02, 97.83it/s]
 31%|███       | 108/346 [00:01<00:02, 99.58it/s]
 34%|███▍      | 119/346 [00:01<00:02, 101.48it/s]
 38%|███▊      | 130/346 [00:01<00:02, 100.60it/s]
 41%|████      | 141/346 [00:01<00:02, 101.69it/s]
 44%|████▍     | 152/346 [00:01<00:01, 102.76it/s]
 47%|████▋     | 164/346 [00:01<00:01, 106.33it/s]
 51%|█████     | 176/346 [00:01<00:01, 109.02it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 110.56it/s]
 58%|█████▊    | 200/346 [00:01<00:01, 101.83it/s]
 61%|██████    | 211/346 [00:02<00:01, 101.66it/s]
 64%|██████▍   | 222/346 [00:02<00:01, 100.5

[2m[36m(func pid=23240)[0m Epoch 00121: reducing learning rate of group 0 to 7.4244e-07.


  3%|▎         | 11/346 [00:00<00:03, 101.28it/s]
  6%|▋         | 22/346 [00:00<00:03, 96.42it/s] 
  9%|▉         | 32/346 [00:00<00:03, 88.81it/s]
 12%|█▏        | 41/346 [00:00<00:03, 88.04it/s]
 15%|█▍        | 51/346 [00:00<00:03, 91.41it/s]
 18%|█▊        | 62/346 [00:00<00:02, 94.70it/s]
 21%|██        | 73/346 [00:00<00:02, 95.84it/s]
 27%|██▋       | 95/346 [00:00<00:02, 99.03it/s]
 30%|███       | 105/346 [00:01<00:02, 98.49it/s]
 33%|███▎      | 115/346 [00:01<00:02, 91.67it/s]
 36%|███▌      | 125/346 [00:01<00:02, 90.49it/s]
 39%|███▉      | 135/346 [00:01<00:02, 91.33it/s]
 42%|████▏     | 145/346 [00:01<00:02, 93.31it/s]
 45%|████▌     | 156/346 [00:01<00:01, 96.69it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 99.31it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 98.48it/s]
 58%|█████▊    | 199/346 [00:02<00:01, 100.78it/s]
 61%|██████    | 210/346 [00:02<00:01, 98.14it/s] 
 64%|██████▎   | 220/346 [00:02<00:01, 98.08it/s]
 67%|██████▋   | 231/346 [00:02<00:01, 99.00it/s]
 70%

[2m[36m(func pid=23240)[0m Epoch 00132: reducing learning rate of group 0 to 3.7122e-07.


  3%|▎         | 11/346 [00:00<00:03, 106.63it/s]
  6%|▋         | 22/346 [00:00<00:02, 108.15it/s]
 13%|█▎        | 44/346 [00:00<00:02, 107.46it/s]
 16%|█▌        | 56/346 [00:00<00:02, 109.53it/s]
 20%|█▉        | 68/346 [00:00<00:02, 110.89it/s]
 23%|██▎       | 80/346 [00:00<00:02, 109.00it/s]
 26%|██▋       | 91/346 [00:00<00:02, 108.56it/s]
 29%|██▉       | 102/346 [00:00<00:02, 105.95it/s]
 33%|███▎      | 113/346 [00:01<00:02, 106.38it/s]
 36%|███▌      | 124/346 [00:01<00:02, 106.50it/s]
 43%|████▎     | 148/346 [00:01<00:01, 110.39it/s]
 46%|████▌     | 160/346 [00:01<00:01, 111.47it/s]
 50%|████▉     | 172/346 [00:01<00:01, 113.62it/s]
 53%|█████▎    | 184/346 [00:01<00:01, 114.83it/s]
 57%|█████▋    | 196/346 [00:01<00:01, 113.93it/s]
 60%|██████    | 209/346 [00:01<00:01, 116.64it/s]
 64%|██████▍   | 221/346 [00:01<00:01, 116.07it/s]
 67%|██████▋   | 233/346 [00:02<00:00, 116.08it/s]
 71%|███████   | 245/346 [00:02<00:00, 113.57it/s]
 74%|███████▍  | 257/346 [00:02<00:00,

[2m[36m(func pid=23240)[0m Epoch 00138: reducing learning rate of group 0 to 1.8561e-07.


  6%|▌         | 20/346 [00:00<00:03, 96.63it/s]
  9%|▊         | 30/346 [00:00<00:03, 96.35it/s]
 12%|█▏        | 41/346 [00:00<00:03, 99.72it/s]
 15%|█▍        | 51/346 [00:00<00:02, 98.54it/s]
 18%|█▊        | 61/346 [00:00<00:02, 97.31it/s]
 21%|██        | 71/346 [00:00<00:02, 96.14it/s]
 23%|██▎       | 81/346 [00:00<00:02, 95.82it/s]
 27%|██▋       | 92/346 [00:00<00:02, 96.58it/s]
 30%|██▉       | 103/346 [00:01<00:02, 98.45it/s]
 33%|███▎      | 114/346 [00:01<00:02, 100.05it/s]
 36%|███▌      | 125/346 [00:01<00:02, 100.94it/s]
 39%|███▉      | 136/346 [00:01<00:02, 101.76it/s]
 42%|████▏     | 147/346 [00:01<00:01, 103.04it/s]
 46%|████▌     | 158/346 [00:01<00:01, 102.23it/s]
 49%|████▉     | 169/346 [00:01<00:01, 102.73it/s]
 52%|█████▏    | 180/346 [00:01<00:01, 102.58it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 103.50it/s]
 58%|█████▊    | 202/346 [00:02<00:01, 103.37it/s]
 62%|██████▏   | 213/346 [00:02<00:01, 103.44it/s]
 65%|██████▍   | 224/346 [00:02<00:01, 101.20it/

[2m[36m(func pid=23240)[0m Epoch 00144: reducing learning rate of group 0 to 9.2805e-08.


  4%|▍         | 13/346 [00:00<00:02, 121.29it/s]
  8%|▊         | 26/346 [00:00<00:02, 116.50it/s]
 11%|█         | 38/346 [00:00<00:02, 114.28it/s]
 14%|█▍        | 50/346 [00:00<00:02, 114.52it/s]
 18%|█▊        | 62/346 [00:00<00:02, 116.35it/s]
 21%|██▏       | 74/346 [00:00<00:02, 116.48it/s]
 25%|██▌       | 87/346 [00:00<00:02, 117.73it/s]
 29%|██▉       | 100/346 [00:00<00:02, 118.61it/s]
 32%|███▏      | 112/346 [00:00<00:01, 118.86it/s]
 36%|███▌      | 124/346 [00:01<00:01, 117.55it/s]
 40%|███▉      | 137/346 [00:01<00:01, 118.78it/s]
 43%|████▎     | 149/346 [00:01<00:01, 115.44it/s]
 47%|████▋     | 161/346 [00:01<00:01, 116.46it/s]
 50%|█████     | 173/346 [00:01<00:01, 115.14it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 112.55it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 113.75it/s]
 60%|██████    | 209/346 [00:01<00:01, 112.31it/s]
 64%|██████▍   | 221/346 [00:01<00:01, 111.02it/s]
 67%|██████▋   | 233/346 [00:02<00:01, 111.93it/s]
 71%|███████   | 245/346 [00:02<00:00,

[2m[36m(func pid=23240)[0m Epoch 00150: reducing learning rate of group 0 to 4.6402e-08.


100%|██████████| 50/50 [00:00<00:00, 477.89it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  1%|          | 1/173 [00:01<05:08,  1.79s/it]
 13%|█▎        | 22/173 [00:01<00:09, 15.97it/s]
 25%|██▌       | 44/173 [00:01<00:03, 35.28it/s]
 38%|███▊      | 66/173 [00:02<00:01, 57.21it/s]
 50%|█████     | 87/173 [00:02<00:01, 79.06it/s]
 62%|██████▏   | 108/173 [00:02<00:00, 101.47it/s]
 75%|███████▍  | 129/173 [00:02<00:00, 122.13it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 495.41it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  8%|▊         | 13/173 [00:00<00:01, 127.23it/s]
 18%|█▊        | 32/173 [00:00<00:00, 160.53it/s]
 30%|███       | 52/173 [00:00<00:00, 176.74it/s]
 42%|████▏     | 72/173 [00:00<00:00, 184.34it/s]
 54%|█████▍    | 93/173 [00:00<00:00, 192.62it/s]
 66%|██████▌   | 114/173 [00:00<00:00, 196.53it/s]
 78%|███████▊  | 135/173 [00:00<00:00, 200.81it/s]
 91%|█████████ | 157/173 [00:00<00:00, 206.21it/s]
100%|██████████| 50/50 [00:00<00:0

[2m[36m(func pid=14196)[0m Epoch 00034: reducing learning rate of group 0 to 5.2884e-05.


 24%|██▍       | 42/173 [00:00<00:00, 206.46it/s]
 36%|███▋      | 63/173 [00:00<00:00, 198.85it/s]
 49%|████▊     | 84/173 [00:00<00:00, 198.61it/s]
 61%|██████    | 105/173 [00:00<00:00, 199.92it/s]
 73%|███████▎  | 126/173 [00:00<00:00, 202.48it/s]
 85%|████████▍ | 147/173 [00:00<00:00, 198.54it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
 92%|█████████▏| 46/50 [00:00<00:00, 459.40it/s]
100%|██████████| 50/50 [00:00<00:00, 450.61it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  9%|▊         | 15/173 [00:00<00:01, 144.23it/s]
 17%|█▋        | 30/173 [00:00<00:00, 146.62it/s]
 28%|██▊       | 49/173 [00:00<00:00, 166.06it/s]
 40%|███▉      | 69/173 [00:00<00:00, 176.06it/s]
 50%|█████     | 87/173 [00:00<00:00, 176.26it/s]
 61%|██████    | 105/173 [00:00<00:00, 170.58it/s]
 72%|███████▏  | 125/173 [00:00<00:00, 176.83it/s]
 83%|████████▎ | 144/173 [00:00<00:00, 180.51it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 258.49it/s]
  0%|          | 0/173 [00:00

[2m[36m(func pid=14196)[0m Epoch 00040: reducing learning rate of group 0 to 2.6442e-05.


  0%|          | 0/173 [00:00<?, ?it/s]
  5%|▌         | 9/173 [00:00<00:01, 87.59it/s]
 16%|█▌        | 27/173 [00:00<00:01, 135.66it/s]
 27%|██▋       | 46/173 [00:00<00:00, 156.89it/s]
 38%|███▊      | 66/173 [00:00<00:00, 170.88it/s]
 50%|████▉     | 86/173 [00:00<00:00, 180.18it/s]
 62%|██████▏   | 107/173 [00:00<00:00, 187.28it/s]
 73%|███████▎  | 127/173 [00:00<00:00, 190.71it/s]
 86%|████████▌ | 148/173 [00:00<00:00, 194.41it/s]
 97%|█████████▋| 168/173 [00:00<00:00, 193.95it/s]
100%|██████████| 173/173 [00:00<00:00, 180.73it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 480.60it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  9%|▊         | 15/173 [00:00<00:01, 144.01it/s]
 17%|█▋        | 30/173 [00:00<00:01, 100.82it/s]
 27%|██▋       | 46/173 [00:00<00:01, 119.63it/s]
 35%|███▍      | 60/173 [00:00<00:00, 125.09it/s]
 45%|████▍     | 77/173 [00:00<00:00, 138.30it/s]
 55%|█████▍    | 95/173 [00:00<00:00, 149.10it/s]
 65%|██████▍   | 112/173 [00:

[2m[36m(func pid=14196)[0m Epoch 00046: reducing learning rate of group 0 to 1.3221e-05.


 12%|█▏        | 20/173 [00:00<00:00, 187.58it/s]
 23%|██▎       | 40/173 [00:00<00:00, 193.90it/s]
 35%|███▍      | 60/173 [00:00<00:00, 140.58it/s]
 46%|████▌     | 80/173 [00:00<00:00, 156.45it/s]
 58%|█████▊    | 100/173 [00:00<00:00, 169.72it/s]
 70%|██████▉   | 121/173 [00:00<00:00, 179.76it/s]
 94%|█████████▍| 163/173 [00:00<00:00, 190.96it/s]
100%|██████████| 173/173 [00:00<00:00, 179.69it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 509.25it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  9%|▉         | 16/173 [00:00<00:00, 159.75it/s]
 18%|█▊        | 32/173 [00:00<00:00, 153.64it/s]
 29%|██▉       | 51/173 [00:00<00:00, 168.44it/s]
 40%|████      | 70/173 [00:00<00:00, 173.96it/s]
 52%|█████▏    | 90/173 [00:00<00:00, 180.11it/s]
 63%|██████▎   | 109/173 [00:00<00:00, 182.77it/s]
 75%|███████▍  | 129/173 [00:00<00:00, 187.07it/s]
 87%|████████▋ | 151/173 [00:00<00:00, 194.91it/s]
 99%|█████████▉| 172/173 [00:00<00:00, 198.21it/s]
100%|█████████

[2m[36m(func pid=14196)[0m Epoch 00052: reducing learning rate of group 0 to 6.6104e-06.


 12%|█▏        | 20/173 [00:00<00:00, 199.55it/s]
 24%|██▎       | 41/173 [00:00<00:00, 203.83it/s]
 36%|███▌      | 62/173 [00:00<00:00, 200.86it/s]
 48%|████▊     | 83/173 [00:00<00:00, 199.05it/s]
 60%|██████    | 104/173 [00:00<00:00, 202.79it/s]
 72%|███████▏  | 125/173 [00:00<00:00, 202.29it/s]
 85%|████████▍ | 147/173 [00:00<00:00, 205.67it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 481.36it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 10%|█         | 18/173 [00:00<00:00, 176.20it/s]
 23%|██▎       | 39/173 [00:00<00:00, 194.47it/s]
 35%|███▍      | 60/173 [00:00<00:00, 195.61it/s]
 46%|████▌     | 80/173 [00:00<00:00, 197.01it/s]
 58%|█████▊    | 100/173 [00:00<00:00, 195.37it/s]
 69%|██████▉   | 120/173 [00:00<00:00, 196.37it/s]
 81%|████████  | 140/173 [00:00<00:00, 186.74it/s]
100%|██████████| 173/173 [00:00<00:00, 188.15it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 470.68it/s]
  0%|          | 0/173 [00:

[2m[36m(func pid=14196)[0m Epoch 00058: reducing learning rate of group 0 to 3.3052e-06.


  0%|          | 0/173 [00:00<?, ?it/s]
 16%|█▌        | 28/173 [00:00<00:01, 138.85it/s]
 28%|██▊       | 48/173 [00:00<00:00, 163.53it/s]
 39%|███▊      | 67/173 [00:00<00:00, 172.35it/s]
 51%|█████     | 88/173 [00:00<00:00, 184.18it/s]
 63%|██████▎   | 109/173 [00:00<00:00, 192.16it/s]
 76%|███████▌  | 131/173 [00:00<00:00, 199.16it/s]
 88%|████████▊ | 152/173 [00:00<00:00, 200.24it/s]
100%|██████████| 173/173 [00:00<00:00, 186.27it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 521.51it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 12%|█▏        | 20/173 [00:00<00:00, 198.08it/s]
 23%|██▎       | 40/173 [00:00<00:00, 198.04it/s]
 36%|███▌      | 62/173 [00:00<00:00, 205.32it/s]
 48%|████▊     | 83/173 [00:00<00:00, 204.81it/s]
 61%|██████    | 105/173 [00:00<00:00, 207.84it/s]
 73%|███████▎  | 126/173 [00:00<00:00, 205.95it/s]
 85%|████████▍ | 147/173 [00:00<00:00, 205.84it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00,

[2m[36m(func pid=14196)[0m Epoch 00064: reducing learning rate of group 0 to 1.6526e-06.


 20%|█▉        | 34/173 [00:00<00:00, 166.52it/s]
 31%|███       | 53/173 [00:00<00:00, 173.86it/s]
 41%|████      | 71/173 [00:00<00:00, 172.57it/s]
 51%|█████▏    | 89/173 [00:00<00:00, 169.75it/s]
 62%|██████▏   | 107/173 [00:00<00:00, 170.28it/s]
 73%|███████▎  | 127/173 [00:00<00:00, 177.96it/s]
 86%|████████▌ | 148/173 [00:00<00:00, 186.82it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 529.15it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  6%|▋         | 11/173 [00:00<00:01, 109.54it/s]
 17%|█▋        | 30/173 [00:00<00:00, 154.67it/s]
 29%|██▉       | 50/173 [00:00<00:00, 173.70it/s]
 40%|███▉      | 69/173 [00:00<00:00, 176.84it/s]
 50%|█████     | 87/173 [00:00<00:00, 169.49it/s]
 70%|██████▉   | 121/173 [00:00<00:00, 166.75it/s]
 80%|███████▉  | 138/173 [00:00<00:00, 164.22it/s]
 90%|████████▉ | 155/173 [00:00<00:00, 165.19it/s]
100%|██████████| 173/173 [00:01<00:00, 164.96it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00

[2m[36m(func pid=14196)[0m Epoch 00070: reducing learning rate of group 0 to 8.2631e-07.


  9%|▊         | 15/173 [00:00<00:01, 139.16it/s]
 17%|█▋        | 29/173 [00:00<00:01, 126.57it/s]
 27%|██▋       | 47/173 [00:00<00:00, 146.78it/s]
 39%|███▉      | 68/173 [00:00<00:00, 167.99it/s]
 51%|█████▏    | 89/173 [00:00<00:00, 181.23it/s]
 64%|██████▎   | 110/173 [00:00<00:00, 189.44it/s]
 75%|███████▌  | 130/173 [00:00<00:00, 191.32it/s]
 87%|████████▋ | 150/173 [00:00<00:00, 192.85it/s]
 99%|█████████▉| 171/173 [00:00<00:00, 195.90it/s]
100%|██████████| 173/173 [00:00<00:00, 180.59it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 11%|█         | 19/173 [00:00<00:00, 189.85it/s]
 23%|██▎       | 40/173 [00:00<00:00, 195.97it/s]
 35%|███▍      | 60/173 [00:00<00:00, 197.63it/s]
 47%|████▋     | 81/173 [00:00<00:00, 200.61it/s]
 59%|█████▉    | 102/173 [00:00<00:00, 202.16it/s]
 71%|███████   | 123/173 [00:00<00:00, 202.81it/s]
 83%|████████▎ | 144/173 [00:00<00:00, 201.13it/s]
 95%|█████████▌| 165/173 [00:00<00:00, 202.10it/s]
100%|███████

[2m[36m(func pid=14196)[0m Epoch 00076: reducing learning rate of group 0 to 4.1315e-07.


 23%|██▎       | 40/173 [00:00<00:00, 199.92it/s]
 35%|███▍      | 60/173 [00:00<00:00, 195.23it/s]
 46%|████▌     | 80/173 [00:00<00:00, 186.31it/s]
 57%|█████▋    | 99/173 [00:00<00:00, 183.78it/s]
 68%|██████▊   | 118/173 [00:00<00:00, 184.64it/s]
 79%|███████▉  | 137/173 [00:00<00:00, 183.35it/s]
 91%|█████████▏| 158/173 [00:00<00:00, 189.82it/s]
100%|██████████| 173/173 [00:00<00:00, 189.50it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 537.13it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 12%|█▏        | 20/173 [00:00<00:00, 199.46it/s]
 35%|███▌      | 61/173 [00:00<00:00, 161.13it/s]
 47%|████▋     | 81/173 [00:00<00:00, 172.74it/s]
 59%|█████▉    | 102/173 [00:00<00:00, 184.71it/s]
 71%|███████   | 122/173 [00:00<00:00, 189.04it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 499.78it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  8%|▊         | 13/173 [00:00<00:01, 126.93it/s]
 16%|█▌        | 28/173 [00:00<00:01, 

[2m[36m(func pid=14196)[0m Epoch 00082: reducing learning rate of group 0 to 2.0658e-07.


 23%|██▎       | 39/173 [00:00<00:00, 193.09it/s]
 34%|███▍      | 59/173 [00:00<00:00, 138.54it/s]
 44%|████▍     | 76/173 [00:00<00:00, 146.62it/s]
 55%|█████▌    | 96/173 [00:00<00:00, 162.00it/s]
 67%|██████▋   | 116/173 [00:00<00:00, 172.73it/s]
 79%|███████▊  | 136/173 [00:00<00:00, 180.19it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 452.32it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  6%|▋         | 11/173 [00:00<00:01, 108.81it/s]
 17%|█▋        | 29/173 [00:00<00:00, 148.02it/s]
 29%|██▉       | 50/173 [00:00<00:00, 172.55it/s]
 40%|████      | 70/173 [00:00<00:00, 181.85it/s]
 52%|█████▏    | 90/173 [00:00<00:00, 186.39it/s]
 64%|██████▎   | 110/173 [00:00<00:00, 190.07it/s]
 76%|███████▌  | 131/173 [00:00<00:00, 194.24it/s]
 87%|████████▋ | 151/173 [00:00<00:00, 195.57it/s]
100%|██████████| 173/173 [00:00<00:00, 184.07it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 514.93it/s]
  0%|          | 0/173 [00:0

[2m[36m(func pid=14196)[0m Epoch 00088: reducing learning rate of group 0 to 1.0329e-07.


 17%|█▋        | 29/173 [00:00<00:00, 144.29it/s]
 28%|██▊       | 48/173 [00:00<00:00, 164.22it/s]
 39%|███▉      | 68/173 [00:00<00:00, 175.50it/s]
 51%|█████     | 88/173 [00:00<00:00, 183.48it/s]
 62%|██████▏   | 108/173 [00:00<00:00, 184.75it/s]
 74%|███████▍  | 128/173 [00:00<00:00, 188.43it/s]
 85%|████████▍ | 147/173 [00:00<00:00, 184.98it/s]
100%|██████████| 173/173 [00:00<00:00, 178.86it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 504.47it/s]
 10%|█         | 18/173 [00:00<00:00, 178.54it/s]
 21%|██        | 36/173 [00:00<00:00, 173.08it/s]
 32%|███▏      | 55/173 [00:00<00:00, 177.26it/s]
 43%|████▎     | 74/173 [00:00<00:00, 178.88it/s]
 54%|█████▍    | 94/173 [00:00<00:00, 183.06it/s]
 65%|██████▌   | 113/173 [00:00<00:00, 184.25it/s]
 77%|███████▋  | 133/173 [00:00<00:00, 188.04it/s]
 88%|████████▊ | 153/173 [00:00<00:00, 189.89it/s]
100%|██████████| 173/173 [00:00<00:00, 185.65it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████

[2m[36m(func pid=14196)[0m Epoch 00094: reducing learning rate of group 0 to 5.1644e-08.


 10%|█         | 18/173 [00:00<00:00, 178.29it/s]
 21%|██        | 36/173 [00:00<00:00, 172.00it/s]
 31%|███       | 54/173 [00:00<00:00, 175.07it/s]
 42%|████▏     | 72/173 [00:00<00:00, 176.54it/s]
 54%|█████▍    | 93/173 [00:00<00:00, 187.15it/s]
 66%|██████▋   | 115/173 [00:00<00:00, 195.27it/s]
 79%|███████▊  | 136/173 [00:00<00:00, 198.79it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 462.01it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 10%|█         | 18/173 [00:00<00:00, 173.34it/s]
 22%|██▏       | 38/173 [00:00<00:00, 183.38it/s]
 34%|███▎      | 58/173 [00:00<00:00, 188.37it/s]
 46%|████▌     | 79/173 [00:00<00:00, 194.35it/s]
 58%|█████▊    | 100/173 [00:00<00:00, 197.97it/s]
 70%|██████▉   | 121/173 [00:00<00:00, 200.67it/s]
 82%|████████▏ | 142/173 [00:00<00:00, 200.32it/s]
100%|██████████| 173/173 [00:00<00:00, 197.76it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 504.55it/s]
  0%|          | 0/173 [00:0

[2m[36m(func pid=14196)[0m Epoch 00100: reducing learning rate of group 0 to 2.5822e-08.


 21%|██        | 36/173 [00:00<00:00, 181.17it/s]
 33%|███▎      | 57/173 [00:00<00:00, 191.43it/s]
 56%|█████▌    | 97/173 [00:00<00:00, 195.97it/s]
 68%|██████▊   | 118/173 [00:00<00:00, 198.60it/s]
 80%|████████  | 139/173 [00:00<00:00, 199.23it/s]
 92%|█████████▏| 160/173 [00:00<00:00, 202.49it/s]
100%|██████████| 173/173 [00:00<00:00, 196.35it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 505.01it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
  7%|▋         | 12/173 [00:00<00:01, 115.38it/s]
 16%|█▌        | 28/173 [00:00<00:01, 135.11it/s]
 25%|██▌       | 44/173 [00:00<00:00, 144.77it/s]
 37%|███▋      | 64/173 [00:00<00:00, 163.41it/s]
 48%|████▊     | 83/173 [00:00<00:00, 171.01it/s]
 60%|█████▉    | 103/173 [00:00<00:00, 178.31it/s]
 71%|███████   | 123/173 [00:00<00:00, 183.94it/s]
 83%|████████▎ | 143/173 [00:00<00:00, 186.99it/s]
 95%|█████████▌| 165/173 [00:00<00:00, 194.99it/s]
100%|██████████| 173/173 [00:00<00:00, 177.34it/s]
  0%|        

[2m[36m(func pid=14196)[0m Epoch 00106: reducing learning rate of group 0 to 1.2911e-08.


 10%|█         | 18/173 [00:00<00:00, 177.22it/s]
 21%|██        | 36/173 [00:00<00:00, 178.00it/s]
 33%|███▎      | 57/173 [00:00<00:00, 189.85it/s]
 46%|████▌     | 79/173 [00:00<00:00, 198.00it/s]
 58%|█████▊    | 100/173 [00:00<00:00, 199.07it/s]
 70%|██████▉   | 121/173 [00:00<00:00, 201.42it/s]
 82%|████████▏ | 142/173 [00:00<00:00, 202.95it/s]
100%|██████████| 173/173 [00:00<00:00, 198.97it/s]
  0%|          | 0/50 [00:00<?, ?it/s]
100%|██████████| 50/50 [00:00<00:00, 514.18it/s]
  0%|          | 0/173 [00:00<?, ?it/s]
 12%|█▏        | 20/173 [00:00<00:00, 190.54it/s]
 23%|██▎       | 40/173 [00:00<00:00, 172.12it/s]
 34%|███▎      | 58/173 [00:00<00:00, 165.03it/s]
 43%|████▎     | 75/173 [00:00<00:00, 165.94it/s]
 54%|█████▍    | 94/173 [00:00<00:00, 171.09it/s]
 75%|███████▌  | 130/173 [00:00<00:00, 174.56it/s]
 86%|████████▌ | 148/173 [00:00<00:00, 170.80it/s]
 96%|█████████▌| 166/173 [00:00<00:00, 172.09it/s]
100%|██████████| 173/173 [00:01<00:00, 170.75it/s]
  0%|         

[2m[36m(func pid=21444)[0m Epoch 00049: reducing learning rate of group 0 to 5.8647e-05.


  4%|▍         | 14/346 [00:00<00:02, 137.00it/s]
  8%|▊         | 29/346 [00:00<00:02, 140.50it/s]
 13%|█▎        | 44/346 [00:00<00:02, 131.72it/s]
 17%|█▋        | 59/346 [00:00<00:02, 134.92it/s]
 21%|██▏       | 74/346 [00:00<00:01, 138.31it/s]
 26%|██▌       | 89/346 [00:00<00:01, 139.32it/s]
 30%|███       | 105/346 [00:00<00:01, 143.14it/s]
 35%|███▍      | 120/346 [00:00<00:01, 142.42it/s]
 39%|███▉      | 135/346 [00:00<00:01, 142.79it/s]
 43%|████▎     | 150/346 [00:01<00:01, 144.30it/s]
 48%|████▊     | 165/346 [00:01<00:01, 142.34it/s]
 52%|█████▏    | 180/346 [00:01<00:01, 142.71it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 142.13it/s]
 65%|██████▌   | 225/346 [00:01<00:00, 142.44it/s]
 69%|██████▉   | 240/346 [00:01<00:00, 140.05it/s]
 74%|███████▎  | 255/346 [00:01<00:00, 136.73it/s]
 78%|███████▊  | 269/346 [00:01<00:00, 137.02it/s]
 82%|████████▏ | 285/346 [00:02<00:00, 141.70it/s]
 87%|████████▋ | 300/346 [00:02<00:00, 141.70it/s]
 91%|█████████ | 315/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00061: reducing learning rate of group 0 to 2.9324e-05.


  6%|▋         | 22/346 [00:00<00:02, 109.12it/s]
 10%|█         | 36/346 [00:00<00:02, 122.77it/s]
 15%|█▍        | 51/346 [00:00<00:02, 130.93it/s]
 19%|█▉        | 67/346 [00:00<00:02, 138.99it/s]
 24%|██▎       | 82/346 [00:00<00:01, 141.55it/s]
 28%|██▊       | 97/346 [00:00<00:01, 139.40it/s]
 32%|███▏      | 111/346 [00:00<00:01, 136.66it/s]
 36%|███▋      | 126/346 [00:00<00:01, 137.30it/s]
 40%|████      | 140/346 [00:01<00:01, 137.59it/s]
 45%|████▍     | 155/346 [00:01<00:01, 139.79it/s]
 49%|████▉     | 170/346 [00:01<00:01, 140.63it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 140.95it/s]
 58%|█████▊    | 200/346 [00:01<00:01, 142.01it/s]
 62%|██████▏   | 215/346 [00:01<00:00, 141.32it/s]
 66%|██████▋   | 230/346 [00:01<00:00, 141.45it/s]
 71%|███████   | 245/346 [00:01<00:00, 143.83it/s]
 75%|███████▌  | 260/346 [00:01<00:00, 143.69it/s]
 79%|███████▉  | 275/346 [00:01<00:00, 143.73it/s]
 84%|████████▍ | 290/346 [00:02<00:00, 141.05it/s]
 88%|████████▊ | 305/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00068: reducing learning rate of group 0 to 1.4662e-05.


  4%|▍         | 13/346 [00:00<00:02, 126.88it/s]
 11%|█▏        | 39/346 [00:00<00:02, 124.91it/s]
 16%|█▌        | 54/346 [00:00<00:02, 133.60it/s]
 20%|█▉        | 68/346 [00:00<00:02, 134.84it/s]
 24%|██▍       | 84/346 [00:00<00:01, 140.26it/s]
 29%|██▊       | 99/346 [00:00<00:01, 140.45it/s]
 33%|███▎      | 114/346 [00:00<00:01, 141.98it/s]
 37%|███▋      | 129/346 [00:00<00:01, 142.24it/s]
 46%|████▌     | 159/346 [00:01<00:01, 140.93it/s]
 50%|█████     | 174/346 [00:01<00:01, 139.77it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 138.54it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 137.03it/s]
 63%|██████▎   | 217/346 [00:01<00:00, 139.95it/s]
 67%|██████▋   | 232/346 [00:01<00:00, 140.85it/s]
 71%|███████▏  | 247/346 [00:01<00:00, 140.78it/s]
 76%|███████▌  | 262/346 [00:01<00:00, 142.29it/s]
 80%|████████  | 277/346 [00:01<00:00, 141.95it/s]
 84%|████████▍ | 292/346 [00:02<00:00, 140.15it/s]
 89%|████████▊ | 307/346 [00:02<00:00, 142.12it/s]
 93%|█████████▎| 322/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00075: reducing learning rate of group 0 to 7.3309e-06.


  4%|▍         | 13/346 [00:00<00:02, 126.86it/s]
 11%|█▏        | 39/346 [00:00<00:02, 122.84it/s]
 15%|█▌        | 53/346 [00:00<00:02, 127.31it/s]
 20%|█▉        | 68/346 [00:00<00:02, 134.34it/s]
 24%|██▎       | 82/346 [00:00<00:01, 136.02it/s]
 28%|██▊       | 97/346 [00:00<00:01, 138.92it/s]
 32%|███▏      | 112/346 [00:00<00:01, 141.41it/s]
 37%|███▋      | 127/346 [00:00<00:01, 142.17it/s]
 41%|████      | 142/346 [00:01<00:01, 141.36it/s]
 45%|████▌     | 157/346 [00:01<00:01, 142.19it/s]
 50%|████▉     | 172/346 [00:01<00:01, 140.30it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 136.09it/s]
 58%|█████▊    | 201/346 [00:01<00:01, 136.48it/s]
 62%|██████▏   | 216/346 [00:01<00:00, 138.29it/s]
 67%|██████▋   | 231/346 [00:01<00:00, 140.84it/s]
 71%|███████   | 246/346 [00:01<00:00, 140.09it/s]
 75%|███████▌  | 261/346 [00:01<00:00, 133.11it/s]
 79%|███████▉  | 275/346 [00:02<00:00, 126.80it/s]
 83%|████████▎ | 288/346 [00:02<00:00, 122.85it/s]
 87%|████████▋ | 301/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00082: reducing learning rate of group 0 to 3.6654e-06.


  9%|▊         | 30/346 [00:00<00:02, 141.16it/s]
 13%|█▎        | 45/346 [00:00<00:02, 135.32it/s]
 17%|█▋        | 59/346 [00:00<00:02, 122.60it/s]
 21%|██        | 73/346 [00:00<00:02, 127.63it/s]
 25%|██▌       | 87/346 [00:00<00:01, 131.47it/s]
 29%|██▉       | 102/346 [00:00<00:01, 136.11it/s]
 34%|███▍      | 117/346 [00:00<00:01, 138.38it/s]
 38%|███▊      | 132/346 [00:00<00:01, 138.93it/s]
 42%|████▏     | 146/346 [00:01<00:01, 138.36it/s]
 47%|████▋     | 161/346 [00:01<00:01, 139.36it/s]
 51%|█████     | 175/346 [00:01<00:01, 138.75it/s]
 55%|█████▍    | 190/346 [00:01<00:01, 140.44it/s]
 59%|█████▉    | 205/346 [00:01<00:01, 137.94it/s]
 64%|██████▍   | 221/346 [00:01<00:00, 142.17it/s]
 68%|██████▊   | 236/346 [00:01<00:00, 138.92it/s]
 72%|███████▏  | 250/346 [00:01<00:00, 138.51it/s]
 76%|███████▋  | 264/346 [00:01<00:00, 138.40it/s]
 81%|████████  | 279/346 [00:02<00:00, 139.75it/s]
 85%|████████▍ | 294/346 [00:02<00:00, 141.54it/s]
 89%|████████▉ | 309/346 [00:02<00:0

[2m[36m(func pid=21444)[0m Epoch 00088: reducing learning rate of group 0 to 1.8327e-06.


  7%|▋         | 25/346 [00:00<00:02, 116.21it/s]
 11%|█         | 37/346 [00:00<00:02, 108.03it/s]
 15%|█▍        | 51/346 [00:00<00:02, 118.74it/s]
 19%|█▉        | 66/346 [00:00<00:02, 128.96it/s]
 23%|██▎       | 81/346 [00:00<00:01, 133.60it/s]
 28%|██▊       | 96/346 [00:00<00:01, 136.63it/s]
 32%|███▏      | 112/346 [00:00<00:01, 140.74it/s]
 37%|███▋      | 127/346 [00:00<00:01, 143.17it/s]
 41%|████      | 142/346 [00:01<00:01, 144.77it/s]
 45%|████▌     | 157/346 [00:01<00:01, 144.81it/s]
 50%|████▉     | 172/346 [00:01<00:01, 141.37it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 139.83it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 136.48it/s]
 62%|██████▏   | 216/346 [00:01<00:00, 135.61it/s]
 66%|██████▋   | 230/346 [00:01<00:00, 135.27it/s]
 71%|███████   | 244/346 [00:01<00:00, 136.34it/s]
 75%|███████▍  | 259/346 [00:01<00:00, 139.43it/s]
 79%|███████▉  | 273/346 [00:02<00:00, 138.81it/s]
 83%|████████▎ | 287/346 [00:02<00:00, 137.50it/s]
 87%|████████▋ | 301/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00103: reducing learning rate of group 0 to 9.1636e-07.


  9%|▊         | 30/346 [00:00<00:02, 149.09it/s]
 13%|█▎        | 45/346 [00:00<00:02, 130.08it/s]
 17%|█▋        | 59/346 [00:00<00:02, 133.66it/s]
 21%|██▏       | 74/346 [00:00<00:01, 138.23it/s]
 26%|██▌       | 90/346 [00:00<00:01, 143.04it/s]
 30%|███       | 105/346 [00:00<00:01, 142.69it/s]
 39%|███▉      | 135/346 [00:00<00:01, 139.71it/s]
 43%|████▎     | 150/346 [00:01<00:01, 139.49it/s]
 48%|████▊     | 165/346 [00:01<00:01, 139.47it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 139.33it/s]
 56%|█████▌    | 194/346 [00:01<00:01, 141.09it/s]
 60%|██████    | 209/346 [00:01<00:00, 142.55it/s]
 65%|██████▍   | 224/346 [00:01<00:00, 143.47it/s]
 69%|██████▉   | 239/346 [00:01<00:00, 142.24it/s]
 73%|███████▎  | 254/346 [00:01<00:00, 138.29it/s]
 77%|███████▋  | 268/346 [00:01<00:00, 138.74it/s]
 82%|████████▏ | 283/346 [00:02<00:00, 140.44it/s]
 86%|████████▌ | 298/346 [00:02<00:00, 142.08it/s]
 90%|█████████ | 313/346 [00:02<00:00, 142.63it/s]
 95%|█████████▍| 328/346 [00:02<00:0

[2m[36m(func pid=21444)[0m Epoch 00111: reducing learning rate of group 0 to 4.5818e-07.


  4%|▍         | 14/346 [00:00<00:02, 134.42it/s]
  8%|▊         | 28/346 [00:00<00:02, 117.73it/s]
 12%|█▏        | 40/346 [00:00<00:02, 117.59it/s]
 16%|█▌        | 54/346 [00:00<00:02, 123.24it/s]
 20%|█▉        | 68/346 [00:00<00:02, 128.10it/s]
 24%|██▍       | 83/346 [00:00<00:01, 132.74it/s]
 28%|██▊       | 98/346 [00:00<00:01, 136.40it/s]
 32%|███▏      | 112/346 [00:00<00:01, 137.07it/s]
 37%|███▋      | 127/346 [00:00<00:01, 140.54it/s]
 41%|████▏     | 143/346 [00:01<00:01, 143.52it/s]
 46%|████▌     | 158/346 [00:01<00:01, 142.26it/s]
 50%|█████     | 173/346 [00:01<00:01, 140.38it/s]
 54%|█████▍    | 188/346 [00:01<00:01, 138.87it/s]
 59%|█████▊    | 203/346 [00:01<00:01, 140.48it/s]
 63%|██████▎   | 218/346 [00:01<00:00, 140.77it/s]
 67%|██████▋   | 233/346 [00:01<00:00, 140.87it/s]
 72%|███████▏  | 248/346 [00:01<00:00, 139.64it/s]
 76%|███████▌  | 263/346 [00:01<00:00, 141.79it/s]
 80%|████████  | 278/346 [00:02<00:00, 142.90it/s]
 85%|████████▍ | 293/346 [00:02<00:00,

[2m[36m(func pid=21444)[0m Epoch 00118: reducing learning rate of group 0 to 2.2909e-07.


 11%|█         | 37/346 [00:00<00:02, 109.50it/s]
 14%|█▍        | 50/346 [00:00<00:02, 114.58it/s]
 18%|█▊        | 64/346 [00:00<00:02, 120.68it/s]
 22%|██▏       | 77/346 [00:00<00:02, 122.13it/s]
 26%|██▌       | 90/346 [00:00<00:02, 124.18it/s]
 34%|███▍      | 117/346 [00:00<00:01, 127.14it/s]
 38%|███▊      | 130/346 [00:01<00:01, 123.98it/s]
 41%|████▏     | 143/346 [00:01<00:01, 125.16it/s]
 45%|████▌     | 157/346 [00:01<00:01, 128.41it/s]
 49%|████▉     | 170/346 [00:01<00:01, 128.29it/s]
 53%|█████▎    | 184/346 [00:01<00:01, 129.88it/s]
 57%|█████▋    | 198/346 [00:01<00:01, 130.83it/s]
 62%|██████▏   | 213/346 [00:01<00:00, 134.61it/s]
 66%|██████▌   | 228/346 [00:01<00:00, 137.46it/s]
 70%|██████▉   | 242/346 [00:01<00:00, 134.03it/s]
 74%|███████▍  | 256/346 [00:02<00:00, 134.76it/s]
 78%|███████▊  | 270/346 [00:02<00:00, 132.79it/s]
 82%|████████▏ | 284/346 [00:02<00:00, 131.07it/s]
 86%|████████▌ | 298/346 [00:02<00:00, 131.81it/s]
 90%|█████████ | 312/346 [00:02<00:0

[2m[36m(func pid=21444)[0m Epoch 00124: reducing learning rate of group 0 to 1.1454e-07.


  6%|▋         | 22/346 [00:00<00:02, 112.16it/s]
 10%|█         | 35/346 [00:00<00:02, 119.74it/s]
 14%|█▍        | 49/346 [00:00<00:02, 126.20it/s]
 18%|█▊        | 64/346 [00:00<00:02, 132.25it/s]
 23%|██▎       | 79/346 [00:00<00:01, 135.03it/s]
 27%|██▋       | 93/346 [00:00<00:01, 133.38it/s]
 31%|███       | 107/346 [00:00<00:01, 133.54it/s]
 35%|███▍      | 121/346 [00:00<00:01, 133.17it/s]
 39%|███▉      | 135/346 [00:01<00:01, 131.23it/s]
 43%|████▎     | 149/346 [00:01<00:01, 133.50it/s]
 47%|████▋     | 163/346 [00:01<00:01, 135.32it/s]
 51%|█████     | 177/346 [00:01<00:01, 135.32it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 134.98it/s]
 60%|█████▉    | 206/346 [00:01<00:01, 136.93it/s]
 64%|██████▎   | 220/346 [00:01<00:00, 135.19it/s]
 68%|██████▊   | 236/346 [00:01<00:00, 140.33it/s]
 73%|███████▎  | 251/346 [00:01<00:00, 141.50it/s]
 81%|████████  | 281/346 [00:02<00:00, 142.72it/s]
 86%|████████▌ | 296/346 [00:02<00:00, 143.83it/s]
 90%|████████▉ | 311/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00130: reducing learning rate of group 0 to 5.7272e-08.


  7%|▋         | 24/346 [00:00<00:02, 120.82it/s]
 11%|█         | 38/346 [00:00<00:02, 129.40it/s]
 15%|█▌        | 52/346 [00:00<00:02, 130.94it/s]
 19%|█▉        | 67/346 [00:00<00:02, 135.95it/s]
 23%|██▎       | 81/346 [00:00<00:01, 133.59it/s]
 27%|██▋       | 95/346 [00:00<00:01, 132.13it/s]
 32%|███▏      | 109/346 [00:00<00:01, 133.12it/s]
 36%|███▌      | 124/346 [00:00<00:01, 135.63it/s]
 40%|███▉      | 138/346 [00:01<00:01, 136.40it/s]
 44%|████▍     | 153/346 [00:01<00:01, 138.50it/s]
 48%|████▊     | 167/346 [00:01<00:01, 138.50it/s]
 53%|█████▎    | 182/346 [00:01<00:01, 139.81it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 140.83it/s]
 61%|██████▏   | 212/346 [00:01<00:00, 140.91it/s]
 66%|██████▌   | 227/346 [00:01<00:00, 138.35it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 136.46it/s]
 74%|███████▍  | 256/346 [00:01<00:00, 139.18it/s]
 78%|███████▊  | 271/346 [00:01<00:00, 141.10it/s]
 83%|████████▎ | 286/346 [00:02<00:00, 142.41it/s]
 87%|████████▋ | 301/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00136: reducing learning rate of group 0 to 2.8636e-08.


  8%|▊         | 26/346 [00:00<00:02, 126.07it/s]
 12%|█▏        | 41/346 [00:00<00:02, 131.84it/s]
 16%|█▌        | 55/346 [00:00<00:02, 132.34it/s]
 20%|██        | 70/346 [00:00<00:02, 136.09it/s]
 25%|██▍       | 85/346 [00:00<00:01, 138.14it/s]
 29%|██▊       | 99/346 [00:00<00:01, 137.33it/s]
 33%|███▎      | 113/346 [00:00<00:01, 137.79it/s]
 37%|███▋      | 127/346 [00:00<00:01, 137.64it/s]
 41%|████      | 142/346 [00:01<00:01, 140.01it/s]
 45%|████▌     | 157/346 [00:01<00:01, 141.34it/s]
 50%|████▉     | 172/346 [00:01<00:01, 140.20it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 135.33it/s]
 58%|█████▊    | 202/346 [00:01<00:01, 136.89it/s]
 62%|██████▏   | 216/346 [00:01<00:00, 133.30it/s]
 66%|██████▋   | 230/346 [00:01<00:00, 132.21it/s]
 71%|███████   | 244/346 [00:01<00:00, 129.59it/s]
 74%|███████▍  | 257/346 [00:01<00:00, 128.58it/s]
 78%|███████▊  | 271/346 [00:02<00:00, 129.72it/s]
 82%|████████▏ | 284/346 [00:02<00:00, 129.43it/s]
 86%|████████▌ | 297/346 [00:02<00:00

[2m[36m(func pid=21444)[0m Epoch 00142: reducing learning rate of group 0 to 1.4318e-08.


  3%|▎         | 11/346 [00:00<00:03, 105.71it/s]
  7%|▋         | 24/346 [00:00<00:02, 116.85it/s]
 11%|█         | 38/346 [00:00<00:02, 125.69it/s]
 15%|█▍        | 51/346 [00:00<00:02, 125.77it/s]
 19%|█▉        | 66/346 [00:00<00:02, 132.06it/s]
 23%|██▎       | 80/346 [00:00<00:01, 134.23it/s]
 27%|██▋       | 95/346 [00:00<00:01, 137.89it/s]
 32%|███▏      | 111/346 [00:00<00:01, 143.03it/s]
 36%|███▋      | 126/346 [00:00<00:01, 140.89it/s]
 41%|████      | 141/346 [00:01<00:01, 138.63it/s]
 45%|████▍     | 155/346 [00:01<00:01, 136.94it/s]
 49%|████▉     | 169/346 [00:01<00:01, 136.05it/s]
 53%|█████▎    | 183/346 [00:01<00:01, 133.55it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 98.77it/s] 
 61%|██████    | 211/346 [00:01<00:01, 107.53it/s]
 65%|██████▌   | 226/346 [00:01<00:01, 116.84it/s]
 70%|██████▉   | 241/346 [00:01<00:00, 123.86it/s]
 74%|███████▍  | 256/346 [00:02<00:00, 129.62it/s]
 79%|███████▊  | 272/346 [00:02<00:00, 135.22it/s]
 83%|████████▎ | 288/346 [00:02<00:00,

[2m[36m(func pid=5168)[0m Epoch 00008: reducing learning rate of group 0 to 1.5119e-02.


  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 103.86it/s]
 25%|██▌       | 22/87 [00:00<00:00, 100.92it/s]
 38%|███▊      | 33/87 [00:00<00:00, 96.66it/s] 
 49%|████▉     | 43/87 [00:00<00:00, 94.78it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 100.27it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 228.86it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 88.69it/s]
 21%|██        | 18/87 [00:00<00:00, 78.89it/s]
 30%|██▉       | 26/87 [00:00<00:00, 78.96it/s]
 40%|████      | 35/87 [00:00<00:00, 80.09it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 84.84it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 90.72it/s]
 86%|████████▌ | 75/87 [00:00<00:00, 93.15it/s]
100%|██████████| 87/87 [00:00<00:00, 89.78it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 134.00it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 96.47it/s]
 24%|██▍       | 21/87 [00:00<00

[2m[36m(func pid=5168)[0m Epoch 00014: reducing learning rate of group 0 to 7.5596e-03.


 11%|█▏        | 10/87 [00:00<00:00, 89.12it/s]
 23%|██▎       | 20/87 [00:00<00:00, 90.98it/s]
 34%|███▍      | 30/87 [00:00<00:00, 94.84it/s]
 46%|████▌     | 40/87 [00:00<00:00, 94.42it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 92.39it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 94.34it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 96.06it/s]
100%|██████████| 87/87 [00:00<00:00, 96.28it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 242.39it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 103.06it/s]
 25%|██▌       | 22/87 [00:00<00:00, 102.03it/s]
 38%|███▊      | 33/87 [00:00<00:00, 102.25it/s]
 51%|█████     | 44/87 [00:00<00:00, 100.67it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 101.19it/s]
 87%|████████▋ | 76/87 [00:00<00:00, 98.75it/s] 
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 123.76it/s]
  6%|▌         | 5/87 [00:00<00:01, 45.63it/s]
 16%|█▌        | 14/87 [00:00<00:01, 69.11it/s]
 28%|██▊    

[2m[36m(func pid=5168)[0m Epoch 00020: reducing learning rate of group 0 to 3.7798e-03.


 10%|█         | 9/87 [00:00<00:00, 86.64it/s]
 22%|██▏       | 19/87 [00:00<00:00, 88.18it/s]
 32%|███▏      | 28/87 [00:00<00:00, 87.12it/s]
 44%|████▎     | 38/87 [00:00<00:00, 89.03it/s]
 67%|██████▋   | 58/87 [00:00<00:00, 93.26it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 95.10it/s]
 90%|████████▉ | 78/87 [00:00<00:00, 95.96it/s]
100%|██████████| 87/87 [00:00<00:00, 92.88it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 237.76it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 89.20it/s]
 22%|██▏       | 19/87 [00:00<00:00, 93.12it/s]
 33%|███▎      | 29/87 [00:00<00:00, 95.36it/s]
 45%|████▍     | 39/87 [00:00<00:00, 95.43it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 96.77it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 94.86it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 94.47it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 44%|████▍     | 11/25 [00:00<00:00, 81.90it/s]
100%|██████████| 25/25 [00:00<00:00, 127.37it/s]
  0%|          | 0/

  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 92.72it/s]
 23%|██▎       | 20/87 [00:00<00:00, 86.92it/s]
 34%|███▍      | 30/87 [00:00<00:00, 91.65it/s]
 46%|████▌     | 40/87 [00:00<00:00, 86.41it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 91.45it/s]
 70%|███████   | 61/87 [00:00<00:00, 92.00it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 90.34it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 91.34it/s]
100%|██████████| 87/87 [00:00<00:00, 90.82it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 214.59it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 82.75it/s]
 21%|██        | 18/87 [00:00<00:00, 81.67it/s]
 31%|███       | 27/87 [00:00<00:00, 82.72it/s]
 41%|████▏     | 36/87 [00:00<00:00, 83.59it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 78.78it/s]
 61%|██████    | 53/87 [00:00<00:00, 78.60it/s]
 71%|███████▏  | 62/87 [00:00<00:00, 81.69it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 81.85it/s]
100%|██████████| 87

[2m[36m(func pid=5168)[0m Epoch 00032: reducing learning rate of group 0 to 9.4495e-04.


 11%|█▏        | 10/87 [00:00<00:00, 93.95it/s]
 23%|██▎       | 20/87 [00:00<00:00, 83.59it/s]
 33%|███▎      | 29/87 [00:00<00:00, 83.81it/s]
 45%|████▍     | 39/87 [00:00<00:00, 87.20it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 90.22it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 92.56it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 94.60it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 235.39it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 83.30it/s]
 21%|██        | 18/87 [00:00<00:00, 83.66it/s]
 32%|███▏      | 28/87 [00:00<00:00, 90.45it/s]
 44%|████▎     | 38/87 [00:00<00:00, 88.56it/s]
 55%|█████▌    | 48/87 [00:00<00:00, 90.75it/s]
 67%|██████▋   | 58/87 [00:00<00:00, 90.70it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 92.19it/s]
 90%|████████▉ | 78/87 [00:00<00:00, 92.90it/s]
100%|██████████| 87/87 [00:00<00:00, 91.94it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 136.41it/s]
  0%|          | 0

[2m[36m(func pid=5168)[0m Epoch 00038: reducing learning rate of group 0 to 4.7248e-04.


 23%|██▎       | 20/87 [00:00<00:00, 93.45it/s]
 34%|███▍      | 30/87 [00:00<00:00, 83.21it/s]
 46%|████▌     | 40/87 [00:00<00:00, 86.43it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 92.27it/s]
 83%|████████▎ | 72/87 [00:00<00:00, 97.62it/s]
 95%|█████████▌| 83/87 [00:00<00:00, 99.87it/s]
100%|██████████| 87/87 [00:00<00:00, 95.29it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 94.52it/s]
 23%|██▎       | 20/87 [00:00<00:00, 95.41it/s]
 34%|███▍      | 30/87 [00:00<00:00, 96.15it/s]
 46%|████▌     | 40/87 [00:00<00:00, 80.80it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 87.57it/s]
 70%|███████   | 61/87 [00:00<00:00, 90.73it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 91.73it/s]
100%|██████████| 87/87 [00:00<00:00, 91.88it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 44%|████▍     | 11/25 [00:00<00:00, 85.14it/s]
100%|██████████| 25/25 [00:00<00:00, 128.67it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:0

[2m[36m(func pid=5168)[0m Epoch 00044: reducing learning rate of group 0 to 2.3624e-04.


 23%|██▎       | 20/87 [00:00<00:00, 91.61it/s]
 34%|███▍      | 30/87 [00:00<00:00, 88.36it/s]
 45%|████▍     | 39/87 [00:00<00:00, 79.51it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 84.26it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 90.17it/s]
 80%|████████  | 70/87 [00:00<00:00, 91.84it/s]
100%|██████████| 87/87 [00:00<00:00, 91.47it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 245.22it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 97.87it/s]
 23%|██▎       | 20/87 [00:00<00:00, 94.79it/s]
 34%|███▍      | 30/87 [00:00<00:00, 96.68it/s]
 47%|████▋     | 41/87 [00:00<00:00, 101.05it/s]
 60%|█████▉    | 52/87 [00:00<00:00, 100.00it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 97.46it/s] 
 85%|████████▌ | 74/87 [00:00<00:00, 98.94it/s]
100%|██████████| 87/87 [00:00<00:00, 98.59it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 60%|██████    | 15/25 [00:00<00:00, 97.64it/s]
100%|██████████| 25/25 [00:00<00:00, 130.14it/s]
  0%|         

[2m[36m(func pid=5168)[0m Epoch 00050: reducing learning rate of group 0 to 1.1812e-04.


 13%|█▎        | 11/87 [00:00<00:00, 101.26it/s]
 25%|██▌       | 22/87 [00:00<00:00, 99.14it/s] 
 38%|███▊      | 33/87 [00:00<00:00, 100.06it/s]
 51%|█████     | 44/87 [00:00<00:00, 101.10it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 101.87it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 101.60it/s]
 89%|████████▊ | 77/87 [00:00<00:00, 101.42it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 242.06it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 85.58it/s]
 23%|██▎       | 20/87 [00:00<00:00, 92.98it/s]
 34%|███▍      | 30/87 [00:00<00:00, 95.65it/s]
 47%|████▋     | 41/87 [00:00<00:00, 97.81it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 97.82it/s]
 70%|███████   | 61/87 [00:00<00:00, 97.19it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 97.81it/s]
 94%|█████████▍| 82/87 [00:00<00:00, 99.32it/s]
100%|██████████| 87/87 [00:00<00:00, 97.52it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 124.52it/s]
  0%|     

[2m[36m(func pid=5168)[0m Epoch 00056: reducing learning rate of group 0 to 5.9059e-05.


 22%|██▏       | 19/87 [00:00<00:00, 92.91it/s]
 33%|███▎      | 29/87 [00:00<00:00, 93.26it/s]
 45%|████▍     | 39/87 [00:00<00:00, 85.30it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 89.81it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 91.79it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 93.01it/s]
100%|██████████| 87/87 [00:00<00:00, 93.23it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 98.05it/s]
 23%|██▎       | 20/87 [00:00<00:00, 96.94it/s]
 34%|███▍      | 30/87 [00:00<00:00, 98.31it/s]
 46%|████▌     | 40/87 [00:00<00:00, 81.67it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 86.96it/s]
 70%|███████   | 61/87 [00:00<00:00, 91.90it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 93.42it/s]
100%|██████████| 87/87 [00:00<00:00, 92.93it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 127.49it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 94.71it/s]
 23%|██▎       | 20/87 [00:00<00:00, 91.21it/s]
 34%|███▍      | 3

[2m[36m(func pid=5168)[0m Epoch 00062: reducing learning rate of group 0 to 2.9530e-05.


  9%|▉         | 8/87 [00:00<00:01, 76.25it/s]
 18%|█▊        | 16/87 [00:00<00:00, 71.28it/s]
 30%|██▉       | 26/87 [00:00<00:00, 80.31it/s]
 41%|████▏     | 36/87 [00:00<00:00, 85.30it/s]
 53%|█████▎    | 46/87 [00:00<00:00, 88.13it/s]
 77%|███████▋  | 67/87 [00:00<00:00, 93.89it/s]
 89%|████████▊ | 77/87 [00:00<00:00, 92.14it/s]
100%|██████████| 87/87 [00:00<00:00, 88.26it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 229.46it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 95.88it/s]
 23%|██▎       | 20/87 [00:00<00:00, 98.21it/s]
 34%|███▍      | 30/87 [00:00<00:00, 97.83it/s]
 46%|████▌     | 40/87 [00:00<00:00, 98.51it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 98.14it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 98.08it/s]
 80%|████████  | 70/87 [00:00<00:00, 96.81it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 98.76it/s]
100%|██████████| 87/87 [00:00<00:00, 98.03it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
  0%|          | 0/

[2m[36m(func pid=5168)[0m Epoch 00068: reducing learning rate of group 0 to 1.4765e-05.


 10%|█         | 9/87 [00:00<00:00, 85.99it/s]
 21%|██        | 18/87 [00:00<00:00, 85.12it/s]
 31%|███       | 27/87 [00:00<00:00, 80.09it/s]
 41%|████▏     | 36/87 [00:00<00:00, 81.04it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 82.69it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 85.89it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 84.62it/s]
 84%|████████▍ | 73/87 [00:00<00:00, 85.48it/s]
100%|██████████| 87/87 [00:01<00:00, 85.24it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 205.80it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 98.46it/s]
 23%|██▎       | 20/87 [00:00<00:00, 96.52it/s]
 36%|███▌      | 31/87 [00:00<00:00, 98.98it/s]
 47%|████▋     | 41/87 [00:00<00:00, 98.72it/s]
 59%|█████▊    | 51/87 [00:00<00:00, 98.38it/s]
 70%|███████   | 61/87 [00:00<00:00, 97.01it/s]
 94%|█████████▍| 82/87 [00:00<00:00, 98.39it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 125.62it/s]
  0%|          | 0

  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 84.01it/s]
 22%|██▏       | 19/87 [00:00<00:00, 90.11it/s]
 33%|███▎      | 29/87 [00:00<00:00, 93.24it/s]
 45%|████▍     | 39/87 [00:00<00:00, 87.76it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 92.69it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 93.53it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 95.87it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 96.58it/s]
100%|██████████| 87/87 [00:00<00:00, 93.92it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 221.83it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 101.55it/s]
 25%|██▌       | 22/87 [00:00<00:00, 97.14it/s] 
 37%|███▋      | 32/87 [00:00<00:00, 97.88it/s]
 48%|████▊     | 42/87 [00:00<00:00, 97.62it/s]
 61%|██████    | 53/87 [00:00<00:00, 99.51it/s]
 74%|███████▎  | 64/87 [00:00<00:00, 99.92it/s]
 86%|████████▌ | 75/87 [00:00<00:00, 101.07it/s]
100%|██████████| 87/87 [00:00<00:00, 99.67it/s] 
  0%|          

[2m[36m(func pid=5168)[0m Epoch 00080: reducing learning rate of group 0 to 3.6912e-06.


 11%|█▏        | 10/87 [00:00<00:00, 93.19it/s]
 23%|██▎       | 20/87 [00:00<00:00, 91.36it/s]
 34%|███▍      | 30/87 [00:00<00:00, 89.47it/s]
 45%|████▍     | 39/87 [00:00<00:00, 88.46it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 90.88it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 93.54it/s]
 79%|███████▉  | 69/87 [00:00<00:00, 95.36it/s]
 92%|█████████▏| 80/87 [00:00<00:00, 97.18it/s]
100%|██████████| 87/87 [00:00<00:00, 94.13it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 235.50it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 83.43it/s]
 21%|██        | 18/87 [00:00<00:00, 85.15it/s]
 33%|███▎      | 29/87 [00:00<00:00, 94.79it/s]
 45%|████▍     | 39/87 [00:00<00:00, 94.96it/s]
 56%|█████▋    | 49/87 [00:00<00:00, 95.45it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 97.62it/s]
 80%|████████  | 70/87 [00:00<00:00, 98.36it/s]
100%|██████████| 87/87 [00:00<00:00, 96.88it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 60%|██████    | 15

[2m[36m(func pid=5168)[0m Epoch 00086: reducing learning rate of group 0 to 1.8456e-06.


 11%|█▏        | 10/87 [00:00<00:00, 98.14it/s]
 24%|██▍       | 21/87 [00:00<00:00, 102.10it/s]
 37%|███▋      | 32/87 [00:00<00:00, 96.11it/s] 
 48%|████▊     | 42/87 [00:00<00:00, 96.50it/s]
 61%|██████    | 53/87 [00:00<00:00, 98.44it/s]
 72%|███████▏  | 63/87 [00:00<00:00, 96.47it/s]
 84%|████████▍ | 73/87 [00:00<00:00, 97.29it/s]
100%|██████████| 87/87 [00:00<00:00, 97.84it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 229.66it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 93.93it/s]
 24%|██▍       | 21/87 [00:00<00:00, 99.32it/s]
 36%|███▌      | 31/87 [00:00<00:00, 98.68it/s]
 48%|████▊     | 42/87 [00:00<00:00, 100.02it/s]
 60%|█████▉    | 52/87 [00:00<00:00, 98.85it/s] 
 72%|███████▏  | 63/87 [00:00<00:00, 99.65it/s]
 85%|████████▌ | 74/87 [00:00<00:00, 100.68it/s]
 98%|█████████▊| 85/87 [00:00<00:00, 101.45it/s]
100%|██████████| 87/87 [00:00<00:00, 100.23it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████

[2m[36m(func pid=5168)[0m Epoch 00092: reducing learning rate of group 0 to 9.2280e-07.


 21%|██        | 18/87 [00:00<00:01, 63.23it/s]
 31%|███       | 27/87 [00:00<00:00, 71.58it/s]
 41%|████▏     | 36/87 [00:00<00:00, 75.20it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 78.03it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 82.58it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 85.51it/s]
 95%|█████████▌| 83/87 [00:01<00:00, 85.51it/s]
100%|██████████| 87/87 [00:01<00:00, 81.38it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 231.91it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 94.99it/s]
 23%|██▎       | 20/87 [00:00<00:00, 94.67it/s]
 34%|███▍      | 30/87 [00:00<00:00, 92.97it/s]
 46%|████▌     | 40/87 [00:00<00:00, 94.10it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 95.88it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 96.78it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 97.99it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 96.94it/s]
100%|██████████| 87/87 [00:00<00:00, 95.67it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 2

[2m[36m(func pid=5168)[0m Epoch 00098: reducing learning rate of group 0 to 4.6140e-07.


  0%|          | 0/87 [00:00<?, ?it/s]
 10%|█         | 9/87 [00:00<00:00, 86.23it/s]
 21%|██        | 18/87 [00:00<00:00, 81.64it/s]
 32%|███▏      | 28/87 [00:00<00:00, 86.94it/s]
 45%|████▍     | 39/87 [00:00<00:00, 93.21it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 96.64it/s]
 80%|████████  | 70/87 [00:00<00:00, 96.10it/s]
 93%|█████████▎| 81/87 [00:00<00:00, 97.94it/s]
100%|██████████| 87/87 [00:00<00:00, 95.14it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 268.41it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 109.17it/s]
 25%|██▌       | 22/87 [00:00<00:00, 109.07it/s]
 39%|███▉      | 34/87 [00:00<00:00, 109.89it/s]
 53%|█████▎    | 46/87 [00:00<00:00, 110.52it/s]
 67%|██████▋   | 58/87 [00:00<00:00, 111.70it/s]
 80%|████████  | 70/87 [00:00<00:00, 111.63it/s]
100%|██████████| 87/87 [00:00<00:00, 110.87it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 60%|██████    | 15/25 [00:00<00:00, 107.29it/s]
100%|██████████| 25/

[2m[36m(func pid=5168)[0m Epoch 00104: reducing learning rate of group 0 to 2.3070e-07.


 13%|█▎        | 11/87 [00:00<00:00, 110.00it/s]
 38%|███▊      | 33/87 [00:00<00:00, 101.33it/s]
 51%|█████     | 44/87 [00:00<00:00, 101.15it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 106.01it/s]
 78%|███████▊  | 68/87 [00:00<00:00, 108.62it/s]
 92%|█████████▏| 80/87 [00:00<00:00, 111.02it/s]
100%|██████████| 87/87 [00:00<00:00, 106.12it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 237.13it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 101.94it/s]
 26%|██▋       | 23/87 [00:00<00:00, 110.13it/s]
 40%|████      | 35/87 [00:00<00:00, 111.70it/s]
 54%|█████▍    | 47/87 [00:00<00:00, 112.01it/s]
 68%|██████▊   | 59/87 [00:00<00:00, 111.90it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 113.71it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 76%|███████▌  | 19/25 [00:00<00:00, 111.62it/s]
100%|██████████| 25/25 [00:00<00:00, 124.24it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 93.06it/s]
 23%|██▎    

[2m[36m(func pid=5168)[0m Epoch 00110: reducing learning rate of group 0 to 1.1535e-07.


 13%|█▎        | 11/87 [00:00<00:00, 106.21it/s]
 25%|██▌       | 22/87 [00:00<00:00, 103.86it/s]
 38%|███▊      | 33/87 [00:00<00:00, 104.32it/s]
 52%|█████▏    | 45/87 [00:00<00:00, 108.25it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 105.69it/s]
 77%|███████▋  | 67/87 [00:00<00:00, 102.76it/s]
 90%|████████▉ | 78/87 [00:00<00:00, 104.91it/s]
100%|██████████| 87/87 [00:00<00:00, 105.35it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 204.05it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 96.43it/s]
 23%|██▎       | 20/87 [00:00<00:00, 84.82it/s]
 36%|███▌      | 31/87 [00:00<00:00, 91.86it/s]
 49%|████▉     | 43/87 [00:00<00:00, 101.02it/s]
 62%|██████▏   | 54/87 [00:00<00:00, 103.38it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 106.66it/s]
 90%|████████▉ | 78/87 [00:00<00:00, 108.48it/s]
100%|██████████| 87/87 [00:00<00:00, 102.51it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
 44%|████▍     | 11/25 [00:00<00:00, 93.02it/s]
100%|

[2m[36m(func pid=5168)[0m Epoch 00116: reducing learning rate of group 0 to 5.7675e-08.


 11%|█▏        | 10/87 [00:00<00:00, 93.91it/s]
 23%|██▎       | 20/87 [00:00<00:00, 94.69it/s]
 34%|███▍      | 30/87 [00:00<00:00, 86.63it/s]
 46%|████▌     | 40/87 [00:00<00:00, 90.75it/s]
 57%|█████▋    | 50/87 [00:00<00:00, 89.16it/s]
 69%|██████▉   | 60/87 [00:00<00:00, 90.20it/s]
 82%|████████▏ | 71/87 [00:00<00:00, 93.45it/s]
 94%|█████████▍| 82/87 [00:00<00:00, 96.57it/s]
100%|██████████| 87/87 [00:00<00:00, 93.50it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 11%|█▏        | 10/87 [00:00<00:00, 89.97it/s]
 22%|██▏       | 19/87 [00:00<00:00, 78.94it/s]
 32%|███▏      | 28/87 [00:00<00:00, 82.89it/s]
 43%|████▎     | 37/87 [00:00<00:00, 79.17it/s]
 64%|██████▍   | 56/87 [00:00<00:00, 85.16it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 89.18it/s]
 89%|████████▊ | 77/87 [00:00<00:00, 94.10it/s]
100%|██████████| 87/87 [00:00<00:00, 88.94it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 147.18it/s]
  0%|          | 0

[2m[36m(func pid=5168)[0m Epoch 00122: reducing learning rate of group 0 to 2.8838e-08.


 13%|█▎        | 11/87 [00:00<00:00, 101.53it/s]
 25%|██▌       | 22/87 [00:00<00:00, 88.35it/s] 
 37%|███▋      | 32/87 [00:00<00:00, 91.48it/s]
 49%|████▉     | 43/87 [00:00<00:00, 97.55it/s]
 62%|██████▏   | 54/87 [00:00<00:00, 99.04it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 99.73it/s]
 87%|████████▋ | 76/87 [00:00<00:00, 100.01it/s]
100%|██████████| 87/87 [00:00<00:00, 99.18it/s] 
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 262.93it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 107.85it/s]
 25%|██▌       | 22/87 [00:00<00:00, 101.93it/s]
 38%|███▊      | 33/87 [00:00<00:00, 101.01it/s]
 51%|█████     | 44/87 [00:00<00:00, 101.80it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 101.46it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 102.57it/s]
 89%|████████▊ | 77/87 [00:00<00:00, 101.81it/s]
100%|██████████| 87/87 [00:00<00:00, 102.55it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 144.21it/s]
  0%|

[2m[36m(func pid=5168)[0m Epoch 00128: reducing learning rate of group 0 to 1.4419e-08.


 25%|██▌       | 22/87 [00:00<00:00, 100.44it/s]
 38%|███▊      | 33/87 [00:00<00:00, 99.12it/s] 
 49%|████▉     | 43/87 [00:00<00:00, 98.41it/s]
 62%|██████▏   | 54/87 [00:00<00:00, 99.76it/s]
 75%|███████▍  | 65/87 [00:00<00:00, 100.79it/s]
 87%|████████▋ | 76/87 [00:00<00:00, 101.37it/s]
100%|██████████| 87/87 [00:00<00:00, 100.94it/s]
  0%|          | 0/25 [00:00<?, ?it/s]
100%|██████████| 25/25 [00:00<00:00, 258.14it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
 13%|█▎        | 11/87 [00:00<00:00, 104.83it/s]
 25%|██▌       | 22/87 [00:00<00:00, 100.09it/s]
 38%|███▊      | 33/87 [00:00<00:00, 99.95it/s] 
 51%|█████     | 44/87 [00:00<00:00, 101.84it/s]
 63%|██████▎   | 55/87 [00:00<00:00, 101.79it/s]
 76%|███████▌  | 66/87 [00:00<00:00, 102.10it/s]
100%|██████████| 25/25 [00:00<00:00, 124.44it/s]
  0%|          | 0/87 [00:00<?, ?it/s]
  9%|▉         | 8/87 [00:00<00:01, 77.01it/s]
 21%|██        | 18/87 [00:00<00:00, 85.40it/s]
 32%|███▏      | 28/87 [00:00<00:00, 89.16it/s]
 44%|██

[2m[36m(func pid=22592)[0m Epoch 00008: reducing learning rate of group 0 to 4.3507e-02.


  3%|▎         | 11/346 [00:00<00:03, 107.66it/s]
  6%|▋         | 22/346 [00:00<00:03, 89.22it/s] 
  9%|▉         | 32/346 [00:00<00:03, 88.64it/s]
 12%|█▏        | 43/346 [00:00<00:03, 93.47it/s]
 16%|█▌        | 54/346 [00:00<00:02, 97.94it/s]
 18%|█▊        | 64/346 [00:00<00:02, 98.52it/s]
 22%|██▏       | 75/346 [00:00<00:02, 100.01it/s]
 25%|██▍       | 86/346 [00:00<00:02, 100.38it/s]
 28%|██▊       | 97/346 [00:00<00:02, 101.98it/s]
 31%|███       | 108/346 [00:01<00:02, 104.13it/s]
 34%|███▍      | 119/346 [00:01<00:02, 103.93it/s]
 38%|███▊      | 131/346 [00:01<00:02, 106.85it/s]
 41%|████      | 142/346 [00:01<00:01, 107.73it/s]
 44%|████▍     | 153/346 [00:01<00:01, 108.38it/s]
 47%|████▋     | 164/346 [00:01<00:01, 107.78it/s]
 51%|█████     | 175/346 [00:01<00:01, 108.08it/s]
 54%|█████▍    | 186/346 [00:01<00:01, 107.93it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 108.35it/s]
 60%|██████    | 209/346 [00:02<00:01, 109.64it/s]
 67%|██████▋   | 231/346 [00:02<00:01, 107.9

[2m[36m(func pid=22592)[0m Epoch 00014: reducing learning rate of group 0 to 2.1754e-02.


  3%|▎         | 9/346 [00:00<00:03, 89.29it/s]
  6%|▌         | 20/346 [00:00<00:03, 98.51it/s]
 12%|█▏        | 41/346 [00:00<00:03, 95.62it/s]
 15%|█▌        | 53/346 [00:00<00:02, 102.63it/s]
 19%|█▉        | 65/346 [00:00<00:02, 106.93it/s]
 22%|██▏       | 77/346 [00:00<00:02, 110.63it/s]
 26%|██▌       | 89/346 [00:00<00:02, 112.91it/s]
 33%|███▎      | 113/346 [00:01<00:02, 114.04it/s]
 36%|███▌      | 125/346 [00:01<00:01, 112.79it/s]
 40%|███▉      | 137/346 [00:01<00:01, 113.36it/s]
 43%|████▎     | 149/346 [00:01<00:01, 114.43it/s]
 47%|████▋     | 161/346 [00:01<00:01, 112.18it/s]
 50%|█████     | 173/346 [00:01<00:01, 112.39it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 111.80it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 113.13it/s]
 60%|██████    | 209/346 [00:01<00:01, 111.32it/s]
 64%|██████▍   | 221/346 [00:02<00:01, 109.94it/s]
 67%|██████▋   | 233/346 [00:02<00:01, 111.87it/s]
 71%|███████   | 245/346 [00:02<00:00, 112.59it/s]
 75%|███████▍  | 258/346 [00:02<00:00, 115

[2m[36m(func pid=22592)[0m Epoch 00022: reducing learning rate of group 0 to 1.0877e-02.


  3%|▎         | 10/346 [00:00<00:03, 96.18it/s]
  6%|▌         | 20/346 [00:00<00:03, 96.13it/s]
 12%|█▏        | 40/346 [00:00<00:03, 95.88it/s]
 15%|█▍        | 51/346 [00:00<00:02, 99.80it/s]
 18%|█▊        | 62/346 [00:00<00:02, 102.17it/s]
 21%|██▏       | 74/346 [00:00<00:02, 106.74it/s]
 25%|██▍       | 86/346 [00:00<00:02, 110.00it/s]
 28%|██▊       | 98/346 [00:00<00:02, 112.36it/s]
 32%|███▏      | 111/346 [00:01<00:02, 116.17it/s]
 36%|███▌      | 123/346 [00:01<00:01, 114.44it/s]
 39%|███▉      | 136/346 [00:01<00:01, 116.44it/s]
 43%|████▎     | 149/346 [00:01<00:01, 117.73it/s]
 47%|████▋     | 161/346 [00:01<00:01, 116.77it/s]
 50%|█████     | 173/346 [00:01<00:01, 117.10it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 112.76it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 113.54it/s]
 60%|██████    | 209/346 [00:01<00:01, 115.38it/s]
 64%|██████▍   | 222/346 [00:01<00:01, 117.69it/s]
 68%|██████▊   | 235/346 [00:02<00:00, 119.72it/s]
 71%|███████▏  | 247/346 [00:02<00:00, 118.

[2m[36m(func pid=22592)[0m Epoch 00041: reducing learning rate of group 0 to 5.4384e-03.


  3%|▎         | 9/346 [00:00<00:04, 83.05it/s]
  5%|▌         | 19/346 [00:00<00:03, 91.40it/s]
  8%|▊         | 29/346 [00:00<00:03, 85.63it/s]
 11%|█         | 38/346 [00:00<00:03, 85.86it/s]
 14%|█▍        | 49/346 [00:00<00:03, 91.13it/s]
 18%|█▊        | 61/346 [00:00<00:02, 98.06it/s]
 21%|██        | 73/346 [00:00<00:02, 104.15it/s]
 28%|██▊       | 97/346 [00:00<00:02, 109.27it/s]
 31%|███       | 108/346 [00:01<00:02, 109.28it/s]
 34%|███▍      | 119/346 [00:01<00:02, 109.17it/s]
 38%|███▊      | 130/346 [00:01<00:02, 107.79it/s]
 41%|████      | 141/346 [00:01<00:01, 105.92it/s]
 44%|████▍     | 153/346 [00:01<00:01, 109.41it/s]
 48%|████▊     | 166/346 [00:01<00:01, 113.39it/s]
 51%|█████▏    | 178/346 [00:01<00:01, 109.61it/s]
 55%|█████▌    | 191/346 [00:01<00:01, 113.02it/s]
 59%|█████▊    | 203/346 [00:01<00:01, 112.43it/s]
 62%|██████▏   | 215/346 [00:02<00:01, 112.77it/s]
 66%|██████▌   | 227/346 [00:02<00:01, 114.55it/s]
 69%|██████▉   | 239/346 [00:02<00:00, 113.48i

[2m[36m(func pid=22592)[0m Epoch 00053: reducing learning rate of group 0 to 2.7192e-03.


  3%|▎         | 10/346 [00:00<00:03, 97.34it/s]
  6%|▌         | 20/346 [00:00<00:03, 92.81it/s]
  9%|▊         | 30/346 [00:00<00:03, 95.91it/s]
 12%|█▏        | 42/346 [00:00<00:02, 102.03it/s]
 16%|█▌        | 54/346 [00:00<00:02, 107.99it/s]
 19%|█▉        | 66/346 [00:00<00:02, 111.92it/s]
 23%|██▎       | 78/346 [00:00<00:02, 113.07it/s]
 26%|██▌       | 90/346 [00:00<00:02, 114.05it/s]
 29%|██▉       | 102/346 [00:00<00:02, 111.88it/s]
 33%|███▎      | 114/346 [00:01<00:02, 112.96it/s]
 36%|███▋      | 126/346 [00:01<00:01, 112.40it/s]
 40%|████      | 139/346 [00:01<00:01, 114.80it/s]
 44%|████▎     | 151/346 [00:01<00:01, 116.02it/s]
 47%|████▋     | 163/346 [00:01<00:01, 116.52it/s]
 51%|█████     | 175/346 [00:01<00:01, 117.15it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 115.25it/s]
 58%|█████▊    | 200/346 [00:01<00:01, 117.16it/s]
 62%|██████▏   | 213/346 [00:01<00:01, 118.41it/s]
 65%|██████▌   | 226/346 [00:01<00:01, 119.50it/s]
 69%|██████▉   | 238/346 [00:02<00:00, 117

[2m[36m(func pid=22592)[0m Epoch 00066: reducing learning rate of group 0 to 1.3596e-03.


  3%|▎         | 10/346 [00:00<00:03, 98.96it/s]
  6%|▌         | 21/346 [00:00<00:03, 99.73it/s]
  9%|▉         | 31/346 [00:00<00:03, 90.67it/s]
 12%|█▏        | 42/346 [00:00<00:03, 95.85it/s]
 16%|█▌        | 54/346 [00:00<00:02, 102.37it/s]
 19%|█▉        | 66/346 [00:00<00:02, 107.30it/s]
 23%|██▎       | 78/346 [00:00<00:02, 110.77it/s]
 26%|██▌       | 90/346 [00:00<00:02, 113.48it/s]
 29%|██▉       | 102/346 [00:00<00:02, 115.13it/s]
 33%|███▎      | 115/346 [00:01<00:01, 117.81it/s]
 37%|███▋      | 128/346 [00:01<00:01, 119.37it/s]
 40%|████      | 140/346 [00:01<00:01, 119.51it/s]
 44%|████▍     | 152/346 [00:01<00:01, 119.62it/s]
 47%|████▋     | 164/346 [00:01<00:01, 119.02it/s]
 51%|█████     | 176/346 [00:01<00:01, 119.15it/s]
 58%|█████▊    | 201/346 [00:01<00:01, 118.90it/s]
 62%|██████▏   | 214/346 [00:01<00:01, 120.08it/s]
 66%|██████▌   | 227/346 [00:01<00:00, 119.40it/s]
 69%|██████▉   | 240/346 [00:02<00:00, 119.46it/s]
 73%|███████▎  | 252/346 [00:02<00:00, 119.

[2m[36m(func pid=22592)[0m Epoch 00083: reducing learning rate of group 0 to 6.7980e-04.


  2%|▏         | 8/346 [00:00<00:04, 77.93it/s]
  5%|▌         | 19/346 [00:00<00:03, 93.70it/s]
  9%|▊         | 30/346 [00:00<00:03, 99.93it/s]
 12%|█▏        | 42/346 [00:00<00:02, 107.29it/s]
 16%|█▌        | 54/346 [00:00<00:02, 109.72it/s]
 19%|█▉        | 66/346 [00:00<00:02, 110.11it/s]
 23%|██▎       | 78/346 [00:00<00:02, 106.03it/s]
 26%|██▌       | 90/346 [00:00<00:02, 107.54it/s]
 29%|██▉       | 101/346 [00:00<00:02, 107.64it/s]
 32%|███▏      | 112/346 [00:01<00:02, 105.18it/s]
 36%|███▌      | 124/346 [00:01<00:02, 108.27it/s]
 39%|███▉      | 136/346 [00:01<00:01, 108.85it/s]
 43%|████▎     | 148/346 [00:01<00:01, 109.82it/s]
 46%|████▌     | 160/346 [00:01<00:01, 111.68it/s]
 50%|████▉     | 172/346 [00:01<00:01, 112.97it/s]
 53%|█████▎    | 185/346 [00:01<00:01, 115.80it/s]
 57%|█████▋    | 197/346 [00:01<00:01, 112.29it/s]
 60%|██████    | 209/346 [00:01<00:01, 111.81it/s]
 64%|██████▍   | 221/346 [00:02<00:01, 113.89it/s]
 67%|██████▋   | 233/346 [00:02<00:01, 111.

[2m[36m(func pid=22592)[0m Epoch 00089: reducing learning rate of group 0 to 3.3990e-04.


  3%|▎         | 9/346 [00:00<00:03, 84.64it/s]
  5%|▌         | 19/346 [00:00<00:03, 88.95it/s]
  8%|▊         | 28/346 [00:00<00:03, 89.13it/s]
 11%|█         | 37/346 [00:00<00:03, 86.77it/s]
 14%|█▍        | 48/346 [00:00<00:03, 94.23it/s]
 17%|█▋        | 60/346 [00:00<00:02, 99.74it/s]
 21%|██        | 72/346 [00:00<00:02, 104.72it/s]
 24%|██▍       | 83/346 [00:00<00:02, 105.69it/s]
 30%|███       | 105/346 [00:01<00:02, 106.94it/s]
 34%|███▍      | 117/346 [00:01<00:02, 108.53it/s]
 37%|███▋      | 129/346 [00:01<00:01, 110.01it/s]
 40%|████      | 140/346 [00:01<00:01, 107.21it/s]
 44%|████▎     | 151/346 [00:01<00:01, 107.02it/s]
 47%|████▋     | 163/346 [00:01<00:01, 109.18it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 110.09it/s]
 58%|█████▊    | 199/346 [00:01<00:01, 110.35it/s]
 61%|██████    | 211/346 [00:02<00:01, 110.97it/s]
 64%|██████▍   | 223/346 [00:02<00:01, 110.07it/s]
 68%|██████▊   | 235/346 [00:02<00:01, 106.83it/s]
 71%|███████   | 246/346 [00:02<00:00, 107.66i

[2m[36m(func pid=22592)[0m Epoch 00099: reducing learning rate of group 0 to 1.6995e-04.


  3%|▎         | 10/346 [00:00<00:03, 91.77it/s]
  6%|▌         | 21/346 [00:00<00:03, 98.95it/s]
  9%|▉         | 31/346 [00:00<00:03, 87.92it/s]
 16%|█▌        | 54/346 [00:00<00:02, 100.92it/s]
 19%|█▉        | 65/346 [00:00<00:02, 101.70it/s]
 22%|██▏       | 77/346 [00:00<00:02, 105.70it/s]
 26%|██▌       | 89/346 [00:00<00:02, 109.80it/s]
 29%|██▉       | 101/346 [00:00<00:02, 111.48it/s]
 33%|███▎      | 114/346 [00:01<00:02, 114.69it/s]
 37%|███▋      | 127/346 [00:01<00:01, 116.49it/s]
 44%|████▍     | 152/346 [00:01<00:01, 117.22it/s]
 48%|████▊     | 165/346 [00:01<00:01, 119.03it/s]
 51%|█████     | 177/346 [00:01<00:01, 118.02it/s]
 55%|█████▍    | 189/346 [00:01<00:01, 115.54it/s]
 58%|█████▊    | 201/346 [00:01<00:01, 115.27it/s]
 62%|██████▏   | 213/346 [00:01<00:01, 113.58it/s]
 65%|██████▌   | 225/346 [00:02<00:01, 110.68it/s]
 68%|██████▊   | 237/346 [00:02<00:00, 111.50it/s]
 72%|███████▏  | 250/346 [00:02<00:00, 114.12it/s]
 76%|███████▌  | 263/346 [00:02<00:00, 11

[2m[36m(func pid=22592)[0m Epoch 00107: reducing learning rate of group 0 to 8.4975e-05.


  6%|▌         | 20/346 [00:00<00:03, 97.88it/s]
  9%|▉         | 31/346 [00:00<00:03, 102.80it/s]
 12%|█▏        | 43/346 [00:00<00:02, 106.51it/s]
 16%|█▌        | 55/346 [00:00<00:02, 109.42it/s]
 20%|█▉        | 68/346 [00:00<00:02, 113.87it/s]
 23%|██▎       | 81/346 [00:00<00:02, 116.07it/s]
 30%|███       | 105/346 [00:00<00:02, 116.04it/s]
 34%|███▍      | 117/346 [00:01<00:01, 117.14it/s]
 37%|███▋      | 129/346 [00:01<00:01, 116.94it/s]
 41%|████      | 141/346 [00:01<00:01, 113.41it/s]
 44%|████▍     | 153/346 [00:01<00:01, 113.07it/s]
 48%|████▊     | 166/346 [00:01<00:01, 116.10it/s]
 52%|█████▏    | 179/346 [00:01<00:01, 118.33it/s]
 55%|█████▌    | 192/346 [00:01<00:01, 119.25it/s]
 59%|█████▉    | 205/346 [00:01<00:01, 119.98it/s]
 63%|██████▎   | 218/346 [00:01<00:01, 119.80it/s]
 67%|██████▋   | 231/346 [00:02<00:00, 120.24it/s]
 71%|███████   | 244/346 [00:02<00:00, 119.89it/s]
 74%|███████▍  | 256/346 [00:02<00:00, 118.20it/s]
 77%|███████▋  | 268/346 [00:02<00:00,

[2m[36m(func pid=22592)[0m Epoch 00113: reducing learning rate of group 0 to 4.2487e-05.


  5%|▌         | 19/346 [00:00<00:03, 93.00it/s]
  8%|▊         | 29/346 [00:00<00:03, 88.29it/s]
 12%|█▏        | 41/346 [00:00<00:03, 96.37it/s]
 15%|█▌        | 52/346 [00:00<00:02, 100.60it/s]
 18%|█▊        | 64/346 [00:00<00:02, 105.83it/s]
 22%|██▏       | 76/346 [00:00<00:02, 109.53it/s]
 25%|██▌       | 87/346 [00:00<00:02, 109.30it/s]
 29%|██▊       | 99/346 [00:00<00:02, 110.27it/s]
 32%|███▏      | 112/346 [00:01<00:02, 113.51it/s]
 36%|███▌      | 125/346 [00:01<00:01, 116.21it/s]
 40%|███▉      | 137/346 [00:01<00:01, 116.34it/s]
 43%|████▎     | 149/346 [00:01<00:01, 112.16it/s]
 47%|████▋     | 161/346 [00:01<00:01, 113.41it/s]
 50%|█████     | 173/346 [00:01<00:01, 113.02it/s]
 54%|█████▍    | 186/346 [00:01<00:01, 116.63it/s]
 58%|█████▊    | 199/346 [00:01<00:01, 117.99it/s]
 61%|██████    | 211/346 [00:01<00:01, 118.34it/s]
 65%|██████▍   | 224/346 [00:02<00:01, 119.66it/s]
 68%|██████▊   | 237/346 [00:02<00:00, 121.90it/s]
 72%|███████▏  | 250/346 [00:02<00:00, 120

[2m[36m(func pid=22592)[0m Epoch 00124: reducing learning rate of group 0 to 2.1244e-05.


  3%|▎         | 10/346 [00:00<00:03, 93.80it/s]
  9%|▉         | 32/346 [00:00<00:03, 99.86it/s]
 12%|█▏        | 42/346 [00:00<00:03, 94.95it/s]
 15%|█▌        | 52/346 [00:00<00:03, 95.14it/s]
 18%|█▊        | 64/346 [00:00<00:02, 101.81it/s]
 22%|██▏       | 76/346 [00:00<00:02, 107.24it/s]
 26%|██▌       | 89/346 [00:00<00:02, 111.41it/s]
 29%|██▉       | 101/346 [00:00<00:02, 111.74it/s]
 36%|███▌      | 125/346 [00:01<00:01, 112.01it/s]
 40%|███▉      | 138/346 [00:01<00:01, 115.66it/s]
 44%|████▎     | 151/346 [00:01<00:01, 117.38it/s]
 47%|████▋     | 163/346 [00:01<00:01, 115.75it/s]
 51%|█████     | 175/346 [00:01<00:01, 113.11it/s]
 54%|█████▍    | 187/346 [00:01<00:01, 113.42it/s]
 58%|█████▊    | 199/346 [00:01<00:01, 110.89it/s]
 61%|██████    | 211/346 [00:01<00:01, 110.94it/s]
 64%|██████▍   | 223/346 [00:02<00:01, 111.66it/s]
 68%|██████▊   | 235/346 [00:02<00:00, 114.02it/s]
 72%|███████▏  | 248/346 [00:02<00:00, 116.22it/s]
 75%|███████▌  | 261/346 [00:02<00:00, 117

[2m[36m(func pid=22592)[0m Epoch 00132: reducing learning rate of group 0 to 1.0622e-05.


  3%|▎         | 10/346 [00:00<00:03, 98.79it/s]
  6%|▌         | 20/346 [00:00<00:03, 93.25it/s]
  9%|▊         | 30/346 [00:00<00:03, 92.45it/s]
 12%|█▏        | 41/346 [00:00<00:03, 98.04it/s]
 15%|█▌        | 52/346 [00:00<00:02, 102.07it/s]
 18%|█▊        | 64/346 [00:00<00:02, 105.67it/s]
 22%|██▏       | 76/346 [00:00<00:02, 107.76it/s]
 25%|██▌       | 88/346 [00:00<00:02, 109.51it/s]
 32%|███▏      | 112/346 [00:01<00:02, 109.91it/s]
 36%|███▌      | 123/346 [00:01<00:02, 107.83it/s]
 39%|███▊      | 134/346 [00:01<00:01, 106.57it/s]
 42%|████▏     | 146/346 [00:01<00:01, 108.35it/s]
 46%|████▌     | 158/346 [00:01<00:01, 110.57it/s]
 49%|████▉     | 170/346 [00:01<00:01, 110.93it/s]
 53%|█████▎    | 182/346 [00:01<00:01, 111.07it/s]
 60%|█████▉    | 206/346 [00:01<00:01, 111.24it/s]
 63%|██████▎   | 218/346 [00:02<00:01, 112.43it/s]
 66%|██████▋   | 230/346 [00:02<00:01, 109.65it/s]
 70%|██████▉   | 242/346 [00:02<00:00, 110.45it/s]
 73%|███████▎  | 254/346 [00:02<00:00, 109.

[2m[36m(func pid=22592)[0m Epoch 00145: reducing learning rate of group 0 to 5.3109e-06.


  5%|▌         | 19/346 [00:00<00:03, 94.25it/s]
  8%|▊         | 29/346 [00:00<00:03, 90.22it/s]
 11%|█▏        | 39/346 [00:00<00:03, 92.25it/s]
 15%|█▌        | 52/346 [00:00<00:02, 103.01it/s]
 19%|█▉        | 65/346 [00:00<00:02, 108.77it/s]
 23%|██▎       | 78/346 [00:00<00:02, 113.09it/s]
 26%|██▋       | 91/346 [00:00<00:02, 116.67it/s]
 30%|███       | 104/346 [00:00<00:02, 118.53it/s]
 34%|███▍      | 117/346 [00:01<00:01, 121.52it/s]
 38%|███▊      | 130/346 [00:01<00:01, 122.74it/s]
 41%|████▏     | 143/346 [00:01<00:01, 123.26it/s]
 49%|████▉     | 169/346 [00:01<00:01, 124.65it/s]
 53%|█████▎    | 182/346 [00:01<00:01, 123.97it/s]
 56%|█████▋    | 195/346 [00:01<00:01, 122.52it/s]
 60%|██████    | 208/346 [00:01<00:01, 122.58it/s]
 64%|██████▍   | 221/346 [00:01<00:01, 122.87it/s]
 68%|██████▊   | 234/346 [00:02<00:00, 122.59it/s]
 71%|███████▏  | 247/346 [00:02<00:00, 121.24it/s]
 75%|███████▌  | 260/346 [00:02<00:00, 119.23it/s]
 79%|███████▊  | 272/346 [00:02<00:00, 11

[2m[36m(func pid=6080)[0m Epoch 00011: reducing learning rate of group 0 to 1.2194e-02.


 13%|█▎        | 21/162 [00:00<00:00, 200.20it/s]
 41%|████▏     | 67/162 [00:00<00:00, 220.48it/s]
 56%|█████▌    | 91/162 [00:00<00:00, 225.62it/s]
 72%|███████▏  | 116/162 [00:00<00:00, 231.65it/s]
 86%|████████▋ | 140/162 [00:00<00:00, 231.49it/s]
100%|██████████| 47/47 [00:00<00:00, 593.00it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 12%|█▏        | 20/162 [00:00<00:00, 199.25it/s]
 25%|██▍       | 40/162 [00:00<00:00, 181.38it/s]
 38%|███▊      | 61/162 [00:00<00:00, 190.54it/s]
 50%|█████     | 81/162 [00:00<00:00, 176.85it/s]
 61%|██████    | 99/162 [00:00<00:00, 168.43it/s]
 72%|███████▏  | 117/162 [00:00<00:00, 170.02it/s]
 85%|████████▍ | 137/162 [00:00<00:00, 178.48it/s]
100%|██████████| 162/162 [00:00<00:00, 176.76it/s]
100%|██████████| 47/47 [00:00<00:00, 768.87it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 28%|██▊       | 46/162 [00:00<00:00, 223.35it/s]
 43%|████▎     | 69/162 [00:00<00:00, 225.68it/s]
 58%|█████▊    | 94/162 [00:00<00:00, 231.73it/s]
 73%|███████▎  | 

[2m[36m(func pid=6080)[0m Epoch 00021: reducing learning rate of group 0 to 6.0968e-03.


 14%|█▍        | 23/162 [00:00<00:00, 222.85it/s]
 28%|██▊       | 46/162 [00:00<00:00, 220.10it/s]
 43%|████▎     | 69/162 [00:00<00:00, 212.69it/s]
 56%|█████▌    | 91/162 [00:00<00:00, 213.10it/s]
 70%|███████   | 114/162 [00:00<00:00, 218.73it/s]
 86%|████████▌ | 139/162 [00:00<00:00, 226.63it/s]
100%|██████████| 162/162 [00:00<00:00, 222.76it/s]
100%|██████████| 47/47 [00:00<00:00, 770.90it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▍        | 23/162 [00:00<00:00, 227.71it/s]
 28%|██▊       | 46/162 [00:00<00:00, 225.32it/s]
 43%|████▎     | 69/162 [00:00<00:00, 227.09it/s]
 57%|█████▋    | 92/162 [00:00<00:00, 225.73it/s]
 71%|███████   | 115/162 [00:00<00:00, 221.03it/s]
 85%|████████▌ | 138/162 [00:00<00:00, 213.32it/s]
100%|██████████| 162/162 [00:00<00:00, 217.16it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 727.44it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 236.39it/s]
 30%|███       | 49/162 [00

[2m[36m(func pid=6080)[0m Epoch 00038: reducing learning rate of group 0 to 3.0484e-03.


 30%|██▉       | 48/162 [00:00<00:00, 236.35it/s]
 44%|████▍     | 72/162 [00:00<00:00, 227.78it/s]
 59%|█████▊    | 95/162 [00:00<00:00, 211.05it/s]
 88%|████████▊ | 142/162 [00:00<00:00, 224.21it/s]
100%|██████████| 47/47 [00:00<00:00, 722.61it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 11%|█         | 18/162 [00:00<00:00, 176.25it/s]
 25%|██▌       | 41/162 [00:00<00:00, 203.84it/s]
 38%|███▊      | 62/162 [00:00<00:00, 196.14it/s]
 51%|█████     | 82/162 [00:00<00:00, 190.38it/s]
 63%|██████▎   | 102/162 [00:00<00:00, 186.52it/s]
 76%|███████▌  | 123/162 [00:00<00:00, 192.18it/s]
 90%|████████▉ | 145/162 [00:00<00:00, 199.23it/s]
100%|██████████| 162/162 [00:00<00:00, 189.42it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 647.88it/s]
 14%|█▎        | 22/162 [00:00<00:00, 215.78it/s]
 27%|██▋       | 44/162 [00:00<00:00, 208.09it/s]
 41%|████      | 66/162 [00:00<00:00, 212.90it/s]
 54%|█████▍    | 88/162 [00:00<00:00, 213.96it/s]
 69%|██████▊   | 1

[2m[36m(func pid=6080)[0m Epoch 00044: reducing learning rate of group 0 to 1.5242e-03.


 28%|██▊       | 45/162 [00:00<00:00, 220.44it/s]
 42%|████▏     | 68/162 [00:00<00:00, 219.98it/s]
 56%|█████▌    | 91/162 [00:00<00:00, 209.81it/s]
 70%|██████▉   | 113/162 [00:00<00:00, 210.82it/s]
 85%|████████▍ | 137/162 [00:00<00:00, 219.58it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 755.69it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 11%|█         | 18/162 [00:00<00:00, 174.10it/s]
 22%|██▏       | 36/162 [00:00<00:00, 175.74it/s]
 44%|████▍     | 72/162 [00:00<00:00, 175.46it/s]
 56%|█████▌    | 90/162 [00:00<00:00, 167.04it/s]
 69%|██████▊   | 111/162 [00:00<00:00, 180.32it/s]
 81%|████████  | 131/162 [00:00<00:00, 184.94it/s]
100%|██████████| 162/162 [00:00<00:00, 178.70it/s]
100%|██████████| 47/47 [00:00<00:00, 783.40it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 229.09it/s]
 29%|██▉       | 47/162 [00:00<00:00, 199.57it/s]
 43%|████▎     | 69/162 [00:00<00:00, 208.07it/s]
 56%|█████▌    | 91/162 [00:

[2m[36m(func pid=6080)[0m Epoch 00064: reducing learning rate of group 0 to 3.8105e-04.


 27%|██▋       | 43/162 [00:00<00:00, 205.89it/s]
 40%|███▉      | 64/162 [00:00<00:00, 201.42it/s]
 66%|██████▌   | 107/162 [00:00<00:00, 208.70it/s]
 80%|███████▉  | 129/162 [00:00<00:00, 212.45it/s]
 94%|█████████▍| 152/162 [00:00<00:00, 217.46it/s]
100%|██████████| 162/162 [00:00<00:00, 208.79it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 639.95it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 12%|█▏        | 19/162 [00:00<00:00, 187.75it/s]
 23%|██▎       | 38/162 [00:00<00:00, 189.02it/s]
 36%|███▌      | 58/162 [00:00<00:00, 192.69it/s]
 48%|████▊     | 78/162 [00:00<00:00, 193.59it/s]
 62%|██████▏   | 100/162 [00:00<00:00, 201.24it/s]
 76%|███████▌  | 123/162 [00:00<00:00, 209.88it/s]
 90%|█████████ | 146/162 [00:00<00:00, 215.85it/s]
100%|██████████| 162/162 [00:00<00:00, 207.68it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 637.79it/s]
 13%|█▎        | 21/162 [00:00<00:00, 200.90it/s]
 26%|██▌       | 42/162 [0

[2m[36m(func pid=6080)[0m Epoch 00078: reducing learning rate of group 0 to 1.9053e-04.


 29%|██▉       | 47/162 [00:00<00:00, 235.19it/s]
 44%|████▍     | 71/162 [00:00<00:00, 236.14it/s]
 59%|█████▊    | 95/162 [00:00<00:00, 228.21it/s]
 73%|███████▎  | 118/162 [00:00<00:00, 227.39it/s]
 88%|████████▊ | 142/162 [00:00<00:00, 229.99it/s]
100%|██████████| 162/162 [00:00<00:00, 229.72it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 808.18it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▍        | 23/162 [00:00<00:00, 225.61it/s]
 29%|██▉       | 47/162 [00:00<00:00, 232.38it/s]
 44%|████▍     | 71/162 [00:00<00:00, 231.64it/s]
 59%|█████▊    | 95/162 [00:00<00:00, 222.51it/s]
 73%|███████▎  | 118/162 [00:00<00:00, 215.55it/s]
 86%|████████▋ | 140/162 [00:00<00:00, 215.02it/s]
100%|██████████| 162/162 [00:00<00:00, 216.82it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 697.78it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 232.44it/s]
 30%|██▉       | 48/162 [00:00<00:00, 

[2m[36m(func pid=6080)[0m Epoch 00089: reducing learning rate of group 0 to 9.5263e-05.


 14%|█▍        | 23/162 [00:00<00:00, 224.71it/s]
 28%|██▊       | 46/162 [00:00<00:00, 202.29it/s]
 41%|████▏     | 67/162 [00:00<00:00, 200.21it/s]
 56%|█████▌    | 90/162 [00:00<00:00, 209.68it/s]
 70%|███████   | 114/162 [00:00<00:00, 217.23it/s]
 84%|████████▍ | 136/162 [00:00<00:00, 214.16it/s]
100%|██████████| 162/162 [00:00<00:00, 209.80it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 579.29it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▍        | 23/162 [00:00<00:00, 222.73it/s]
 28%|██▊       | 46/162 [00:00<00:00, 209.98it/s]
 42%|████▏     | 68/162 [00:00<00:00, 206.31it/s]
 55%|█████▍    | 89/162 [00:00<00:00, 198.18it/s]
 67%|██████▋   | 109/162 [00:00<00:00, 194.13it/s]
 80%|███████▉  | 129/162 [00:00<00:00, 188.80it/s]
 91%|█████████▏| 148/162 [00:00<00:00, 188.60it/s]
100%|██████████| 162/162 [00:00<00:00, 194.23it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 691.07it/s]
  0%|          | 0/162 [00:

[2m[36m(func pid=6080)[0m Epoch 00103: reducing learning rate of group 0 to 4.7631e-05.


 14%|█▎        | 22/162 [00:00<00:00, 217.61it/s]
 28%|██▊       | 45/162 [00:00<00:00, 219.60it/s]
 41%|████▏     | 67/162 [00:00<00:00, 206.57it/s]
 70%|███████   | 114/162 [00:00<00:00, 219.66it/s]
 85%|████████▍ | 137/162 [00:00<00:00, 222.99it/s]
100%|██████████| 162/162 [00:00<00:00, 220.00it/s]
100%|██████████| 47/47 [00:00<00:00, 710.59it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 233.00it/s]
 30%|██▉       | 48/162 [00:00<00:00, 232.94it/s]
 44%|████▍     | 72/162 [00:00<00:00, 222.23it/s]
 59%|█████▊    | 95/162 [00:00<00:00, 220.22it/s]
 73%|███████▎  | 118/162 [00:00<00:00, 218.94it/s]
 86%|████████▋ | 140/162 [00:00<00:00, 218.65it/s]
100%|██████████| 162/162 [00:00<00:00, 221.84it/s]
100%|██████████| 47/47 [00:00<00:00, 824.43it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 230.09it/s]
 44%|████▍     | 72/162 [00:00<00:00, 235.70it/s]
 59%|█████▉    | 96/162 [00:00<00:00, 232.60it/s]
 74%|███████▍  |

[2m[36m(func pid=6080)[0m Epoch 00109: reducing learning rate of group 0 to 2.3816e-05.


 12%|█▏        | 19/162 [00:00<00:00, 180.63it/s]
 23%|██▎       | 38/162 [00:00<00:00, 154.98it/s]
 36%|███▌      | 58/162 [00:00<00:00, 171.88it/s]
 49%|████▉     | 79/162 [00:00<00:00, 185.80it/s]
 62%|██████▏   | 101/162 [00:00<00:00, 194.70it/s]
 76%|███████▌  | 123/162 [00:00<00:00, 201.82it/s]
100%|██████████| 162/162 [00:00<00:00, 196.34it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 742.34it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▎        | 22/162 [00:00<00:00, 219.57it/s]
 28%|██▊       | 45/162 [00:00<00:00, 224.54it/s]
 43%|████▎     | 70/162 [00:00<00:00, 232.50it/s]
 73%|███████▎  | 119/162 [00:00<00:00, 234.75it/s]
 88%|████████▊ | 143/162 [00:00<00:00, 225.97it/s]
100%|██████████| 162/162 [00:00<00:00, 226.85it/s]
100%|██████████| 47/47 [00:00<00:00, 722.28it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▍        | 23/162 [00:00<00:00, 225.48it/s]
 28%|██▊       | 46/162 [00:00<00:00, 220.05it/s]
 43%|████▎     | 69/162 [00

[2m[36m(func pid=6080)[0m Epoch 00115: reducing learning rate of group 0 to 1.1908e-05.


 13%|█▎        | 21/162 [00:00<00:00, 207.31it/s]
 26%|██▌       | 42/162 [00:00<00:00, 196.33it/s]
 40%|████      | 65/162 [00:00<00:00, 207.09it/s]
 54%|█████▎    | 87/162 [00:00<00:00, 210.78it/s]
 67%|██████▋   | 109/162 [00:00<00:00, 213.24it/s]
 81%|████████  | 131/162 [00:00<00:00, 212.45it/s]
100%|██████████| 162/162 [00:00<00:00, 211.75it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 592.52it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 13%|█▎        | 21/162 [00:00<00:00, 205.56it/s]
 27%|██▋       | 44/162 [00:00<00:00, 217.94it/s]
 41%|████▏     | 67/162 [00:00<00:00, 222.80it/s]
 57%|█████▋    | 92/162 [00:00<00:00, 230.78it/s]
 72%|███████▏  | 116/162 [00:00<00:00, 229.23it/s]
100%|██████████| 162/162 [00:00<00:00, 229.14it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 757.70it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 238.16it/s]
 30%|██▉       | 48/162 [00:00<00:00, 2

[2m[36m(func pid=6080)[0m Epoch 00121: reducing learning rate of group 0 to 5.9539e-06.


 25%|██▍       | 40/162 [00:00<00:00, 198.05it/s]
 38%|███▊      | 61/162 [00:00<00:00, 200.25it/s]
 51%|█████     | 82/162 [00:00<00:00, 183.32it/s]
 63%|██████▎   | 102/162 [00:00<00:00, 186.94it/s]
 76%|███████▌  | 123/162 [00:00<00:00, 192.62it/s]
 90%|████████▉ | 145/162 [00:00<00:00, 199.14it/s]
100%|██████████| 162/162 [00:00<00:00, 194.01it/s]
100%|██████████| 47/47 [00:00<00:00, 705.99it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 12%|█▏        | 20/162 [00:00<00:00, 199.81it/s]
 25%|██▍       | 40/162 [00:00<00:00, 194.63it/s]
 38%|███▊      | 61/162 [00:00<00:00, 200.67it/s]
 51%|█████     | 82/162 [00:00<00:00, 201.08it/s]
 64%|██████▎   | 103/162 [00:00<00:00, 198.72it/s]
 76%|███████▌  | 123/162 [00:00<00:00, 197.56it/s]
 89%|████████▉ | 144/162 [00:00<00:00, 197.80it/s]
100%|██████████| 47/47 [00:00<00:00, 569.43it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 22%|██▏       | 36/162 [00:00<00:00, 174.80it/s]
 33%|███▎      | 54/162 [00:00<00:00, 158.87it/s]
 45%|████▌     

[2m[36m(func pid=6080)[0m Epoch 00127: reducing learning rate of group 0 to 2.9770e-06.


 14%|█▍        | 23/162 [00:00<00:00, 223.17it/s]
 28%|██▊       | 46/162 [00:00<00:00, 226.17it/s]
 57%|█████▋    | 92/162 [00:00<00:00, 224.60it/s]
 71%|███████   | 115/162 [00:00<00:00, 214.98it/s]
 85%|████████▍ | 137/162 [00:00<00:00, 216.43it/s]
100%|██████████| 47/47 [00:00<00:00, 683.82it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 10%|█         | 17/162 [00:00<00:00, 164.90it/s]
 21%|██        | 34/162 [00:00<00:00, 167.56it/s]
 32%|███▏      | 52/162 [00:00<00:00, 170.22it/s]
 44%|████▍     | 72/162 [00:00<00:00, 177.60it/s]
 56%|█████▌    | 90/162 [00:00<00:00, 172.41it/s]
 68%|██████▊   | 110/162 [00:00<00:00, 179.63it/s]
 79%|███████▉  | 128/162 [00:00<00:00, 172.86it/s]
 90%|█████████ | 146/162 [00:00<00:00, 173.29it/s]
100%|██████████| 162/162 [00:00<00:00, 174.29it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 704.77it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▍        | 23/162 [00:00<00:00, 220.73it/s]
 28%|██▊       | 46/162 [00

[2m[36m(func pid=6080)[0m Epoch 00133: reducing learning rate of group 0 to 1.4885e-06.


 10%|▉         | 16/162 [00:00<00:00, 157.01it/s]
 22%|██▏       | 35/162 [00:00<00:00, 174.70it/s]
 33%|███▎      | 54/162 [00:00<00:00, 179.92it/s]
 44%|████▍     | 72/162 [00:00<00:00, 179.20it/s]
 57%|█████▋    | 92/162 [00:00<00:00, 182.25it/s]
 69%|██████▉   | 112/162 [00:00<00:00, 186.88it/s]
 81%|████████▏ | 132/162 [00:00<00:00, 189.76it/s]
 93%|█████████▎| 151/162 [00:00<00:00, 181.90it/s]
100%|██████████| 162/162 [00:00<00:00, 182.12it/s]
100%|██████████| 47/47 [00:00<00:00, 515.55it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▎        | 22/162 [00:00<00:00, 218.47it/s]
 27%|██▋       | 44/162 [00:00<00:00, 202.11it/s]
 40%|████      | 65/162 [00:00<00:00, 198.60it/s]
 54%|█████▍    | 88/162 [00:00<00:00, 207.99it/s]
 69%|██████▊   | 111/162 [00:00<00:00, 213.73it/s]
 83%|████████▎ | 135/162 [00:00<00:00, 220.33it/s]
100%|██████████| 162/162 [00:00<00:00, 214.88it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 718.95it/s]
  0%|          |

[2m[36m(func pid=6080)[0m Epoch 00139: reducing learning rate of group 0 to 7.4424e-07.


 26%|██▌       | 42/162 [00:00<00:00, 164.59it/s]
 38%|███▊      | 61/162 [00:00<00:00, 172.23it/s]
 51%|█████     | 82/162 [00:00<00:00, 185.48it/s]
 65%|██████▌   | 106/162 [00:00<00:00, 202.57it/s]
 80%|███████▉  | 129/162 [00:00<00:00, 210.72it/s]
100%|██████████| 162/162 [00:00<00:00, 202.01it/s]
100%|██████████| 47/47 [00:00<00:00, 812.87it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▎        | 22/162 [00:00<00:00, 217.73it/s]
 28%|██▊       | 45/162 [00:00<00:00, 222.93it/s]
 42%|████▏     | 68/162 [00:00<00:00, 221.57it/s]
 56%|█████▌    | 91/162 [00:00<00:00, 218.18it/s]
 70%|███████   | 114/162 [00:00<00:00, 219.00it/s]
 85%|████████▍ | 137/162 [00:00<00:00, 219.76it/s]
100%|██████████| 162/162 [00:00<00:00, 218.85it/s]
100%|██████████| 47/47 [00:00<00:00, 836.29it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 235.29it/s]
 30%|██▉       | 48/162 [00:00<00:00, 237.17it/s]
 44%|████▍     | 72/162 [00:00<00:00, 233.73it/s]
 60%|█████▉    |

[2m[36m(func pid=6080)[0m Epoch 00145: reducing learning rate of group 0 to 3.7212e-07.


 13%|█▎        | 21/162 [00:00<00:00, 200.86it/s]
 26%|██▌       | 42/162 [00:00<00:00, 200.50it/s]
 39%|███▉      | 63/162 [00:00<00:00, 204.70it/s]
 67%|██████▋   | 108/162 [00:00<00:00, 213.03it/s]
 81%|████████  | 131/162 [00:00<00:00, 218.44it/s]
100%|██████████| 162/162 [00:00<00:00, 214.62it/s]
  0%|          | 0/47 [00:00<?, ?it/s]
100%|██████████| 47/47 [00:00<00:00, 794.31it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 15%|█▍        | 24/162 [00:00<00:00, 239.46it/s]
 30%|██▉       | 48/162 [00:00<00:00, 231.81it/s]
 44%|████▍     | 72/162 [00:00<00:00, 233.50it/s]
 74%|███████▍  | 120/162 [00:00<00:00, 232.03it/s]
 89%|████████▉ | 144/162 [00:00<00:00, 231.69it/s]
100%|██████████| 162/162 [00:00<00:00, 233.08it/s]
100%|██████████| 47/47 [00:00<00:00, 665.85it/s]
  0%|          | 0/162 [00:00<?, ?it/s]
 14%|█▎        | 22/162 [00:00<00:00, 209.64it/s]
 28%|██▊       | 45/162 [00:00<00:00, 217.92it/s]
 42%|████▏     | 68/162 [00:00<00:00, 222.02it/s]
 56%|█████▌    | 91/162 [00

[2m[36m(func pid=24608)[0m Epoch 00028: reducing learning rate of group 0 to 3.4739e-02.


 26%|██▌       | 21/81 [00:00<00:00, 103.04it/s]
 41%|████      | 33/81 [00:00<00:00, 108.41it/s]
 54%|█████▍    | 44/81 [00:00<00:00, 105.02it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 106.88it/s]
 85%|████████▌ | 69/81 [00:00<00:00, 114.09it/s]
100%|██████████| 81/81 [00:00<00:00, 106.88it/s]
100%|██████████| 24/24 [00:00<00:00, 443.71it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 136.85it/s]
 36%|███▌      | 29/81 [00:00<00:00, 138.98it/s]
 53%|█████▎    | 43/81 [00:00<00:00, 137.01it/s]
 70%|███████   | 57/81 [00:00<00:00, 138.15it/s]
 88%|████████▊ | 71/81 [00:00<00:00, 135.90it/s]
100%|██████████| 81/81 [00:00<00:00, 138.10it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 407.52it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 133.21it/s]
 35%|███▍      | 28/81 [00:00<00:00, 136.42it/s]
 53%|█████▎    | 43/81 [00:00<00:00, 140.02it/s]
 72%|███████▏  | 58/81 [00:00<00:00, 136.40it/s]
 

[2m[36m(func pid=24608)[0m Epoch 00058: reducing learning rate of group 0 to 1.7370e-02.


 19%|█▊        | 15/81 [00:00<00:00, 142.41it/s]
 37%|███▋      | 30/81 [00:00<00:00, 142.92it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 133.68it/s]
 73%|███████▎  | 59/81 [00:00<00:00, 132.06it/s]
 91%|█████████▏| 74/81 [00:00<00:00, 137.66it/s]
100%|██████████| 24/24 [00:00<00:00, 480.31it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 123.16it/s]
 32%|███▏      | 26/81 [00:00<00:00, 122.75it/s]
 48%|████▊     | 39/81 [00:00<00:00, 119.01it/s]
 65%|██████▌   | 53/81 [00:00<00:00, 125.65it/s]
 98%|█████████▊| 79/81 [00:00<00:00, 121.70it/s]
100%|██████████| 81/81 [00:00<00:00, 122.61it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 489.26it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 20%|█▉        | 16/81 [00:00<00:00, 152.42it/s]
 40%|███▉      | 32/81 [00:00<00:00, 145.74it/s]
 58%|█████▊    | 47/81 [00:00<00:00, 143.36it/s]
 78%|███████▊  | 63/81 [00:00<00:00, 149.03it/s]
100%|██████████| 81/81 [00:00<00:00, 144.87it/s]
 

[2m[36m(func pid=24608)[0m Epoch 00064: reducing learning rate of group 0 to 8.6849e-03.


 19%|█▊        | 15/81 [00:00<00:00, 140.00it/s]
 37%|███▋      | 30/81 [00:00<00:00, 141.65it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 142.19it/s]
 94%|█████████▍| 76/81 [00:00<00:00, 144.32it/s]
100%|██████████| 81/81 [00:00<00:00, 141.12it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 376.40it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 121.58it/s]
 32%|███▏      | 26/81 [00:00<00:00, 122.97it/s]
 48%|████▊     | 39/81 [00:00<00:00, 122.80it/s]
 65%|██████▌   | 53/81 [00:00<00:00, 126.84it/s]
 83%|████████▎ | 67/81 [00:00<00:00, 128.02it/s]
100%|██████████| 24/24 [00:00<00:00, 379.92it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 123.31it/s]
 32%|███▏      | 26/81 [00:00<00:00, 110.72it/s]
 48%|████▊     | 39/81 [00:00<00:00, 115.07it/s]
 63%|██████▎   | 51/81 [00:00<00:00, 84.15it/s] 
 75%|███████▌  | 61/81 [00:00<00:00, 86.35it/s]
100%|██████████| 81/81 [00:00<00:00, 100.71it/s]
10

[2m[36m(func pid=24608)[0m Epoch 00070: reducing learning rate of group 0 to 4.3424e-03.


 17%|█▋        | 14/81 [00:00<00:00, 133.62it/s]
 35%|███▍      | 28/81 [00:00<00:00, 134.94it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 132.82it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 121.94it/s]
 89%|████████▉ | 72/81 [00:00<00:00, 132.40it/s]
100%|██████████| 81/81 [00:00<00:00, 131.80it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 443.76it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 144.29it/s]
 37%|███▋      | 30/81 [00:00<00:00, 143.38it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 140.82it/s]
 75%|███████▌  | 61/81 [00:00<00:00, 146.24it/s]
100%|██████████| 24/24 [00:00<00:00, 453.69it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 125.11it/s]
 33%|███▎      | 27/81 [00:00<00:00, 128.24it/s]
 49%|████▉     | 40/81 [00:00<00:00, 124.74it/s]
 67%|██████▋   | 54/81 [00:00<00:00, 126.34it/s]
 83%|████████▎ | 67/81 [00:00<00:00, 123.96it/s]
100%|██████████| 81/81 [00:00<00:00, 128.61it/s]
 

[2m[36m(func pid=24608)[0m Epoch 00076: reducing learning rate of group 0 to 2.1712e-03.


 17%|█▋        | 14/81 [00:00<00:00, 139.71it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 148.15it/s]
 75%|███████▌  | 61/81 [00:00<00:00, 150.46it/s]
100%|██████████| 81/81 [00:00<00:00, 149.42it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 184.28it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 132.38it/s]
 36%|███▌      | 29/81 [00:00<00:00, 137.71it/s]
 54%|█████▍    | 44/81 [00:00<00:00, 140.25it/s]
 73%|███████▎  | 59/81 [00:00<00:00, 143.21it/s]
100%|██████████| 81/81 [00:00<00:00, 143.37it/s]
100%|██████████| 24/24 [00:00<00:00, 479.44it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 20%|█▉        | 16/81 [00:00<00:00, 150.89it/s]
 40%|███▉      | 32/81 [00:00<00:00, 151.04it/s]
 59%|█████▉    | 48/81 [00:00<00:00, 154.04it/s]
 79%|███████▉  | 64/81 [00:00<00:00, 153.88it/s]
100%|██████████| 24/24 [00:00<00:00, 469.59it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 125.06it/s]
 32%|███▏  

[2m[36m(func pid=24608)[0m Epoch 00082: reducing learning rate of group 0 to 1.0856e-03.


 38%|███▊      | 31/81 [00:00<00:00, 150.99it/s]
 58%|█████▊    | 47/81 [00:00<00:00, 128.51it/s]
 77%|███████▋  | 62/81 [00:00<00:00, 133.20it/s]
100%|██████████| 81/81 [00:00<00:00, 135.64it/s]
100%|██████████| 24/24 [00:00<00:00, 498.77it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 20%|█▉        | 16/81 [00:00<00:00, 149.20it/s]
 38%|███▊      | 31/81 [00:00<00:00, 144.85it/s]
 75%|███████▌  | 61/81 [00:00<00:00, 143.98it/s]
 94%|█████████▍| 76/81 [00:00<00:00, 141.16it/s]
100%|██████████| 81/81 [00:00<00:00, 142.83it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 421.36it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 148.78it/s]
 38%|███▊      | 31/81 [00:00<00:00, 152.68it/s]
 58%|█████▊    | 47/81 [00:00<00:00, 154.57it/s]
 78%|███████▊  | 63/81 [00:00<00:00, 154.72it/s]
100%|██████████| 81/81 [00:00<00:00, 154.05it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 497.62it/s]
  0%|      

[2m[36m(func pid=24608)[0m Epoch 00088: reducing learning rate of group 0 to 5.4280e-04.


  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 131.91it/s]
 36%|███▌      | 29/81 [00:00<00:00, 137.51it/s]
 53%|█████▎    | 43/81 [00:00<00:00, 125.87it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 126.37it/s]
 86%|████████▋ | 70/81 [00:00<00:00, 130.58it/s]
100%|██████████| 81/81 [00:00<00:00, 131.32it/s]
100%|██████████| 24/24 [00:00<00:00, 453.96it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 20%|█▉        | 16/81 [00:00<00:00, 153.11it/s]
 40%|███▉      | 32/81 [00:00<00:00, 153.76it/s]
 59%|█████▉    | 48/81 [00:00<00:00, 149.16it/s]
 78%|███████▊  | 63/81 [00:00<00:00, 147.29it/s]
 96%|█████████▋| 78/81 [00:00<00:00, 146.38it/s]
100%|██████████| 81/81 [00:00<00:00, 147.78it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 460.22it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 20%|█▉        | 16/81 [00:00<00:00, 150.01it/s]
 40%|███▉      | 32/81 [00:00<00:00, 146.91it/s]
 58%|█████▊    | 47/81 [00:00<00:00, 145.72it/s]
 77%|██████

[2m[36m(func pid=24608)[0m Epoch 00094: reducing learning rate of group 0 to 2.7140e-04.


 19%|█▊        | 15/81 [00:00<00:00, 145.91it/s]
 37%|███▋      | 30/81 [00:00<00:00, 147.45it/s]
 74%|███████▍  | 60/81 [00:00<00:00, 147.75it/s]
 94%|█████████▍| 76/81 [00:00<00:00, 149.51it/s]
100%|██████████| 81/81 [00:00<00:00, 146.77it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 350.17it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 15%|█▍        | 12/81 [00:00<00:00, 109.90it/s]
 30%|██▉       | 24/81 [00:00<00:00, 111.82it/s]
 44%|████▍     | 36/81 [00:00<00:00, 112.82it/s]
 60%|██████    | 49/81 [00:00<00:00, 117.25it/s]
 79%|███████▉  | 64/81 [00:00<00:00, 127.80it/s]
100%|██████████| 81/81 [00:00<00:00, 124.37it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 455.62it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 141.70it/s]
 37%|███▋      | 30/81 [00:00<00:00, 138.47it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 140.41it/s]
 75%|███████▌  | 61/81 [00:00<00:00, 144.66it/s]
100%|██████

[2m[36m(func pid=24608)[0m Epoch 00100: reducing learning rate of group 0 to 1.3570e-04.


 17%|█▋        | 14/81 [00:00<00:00, 133.45it/s]
 35%|███▍      | 28/81 [00:00<00:00, 131.15it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 134.46it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 134.76it/s]
 86%|████████▋ | 70/81 [00:00<00:00, 133.53it/s]
100%|██████████| 24/24 [00:00<00:00, 438.45it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 28%|██▊       | 23/81 [00:00<00:00, 113.79it/s]
 43%|████▎     | 35/81 [00:00<00:00, 102.33it/s]
 58%|█████▊    | 47/81 [00:00<00:00, 108.24it/s]
 72%|███████▏  | 58/81 [00:00<00:00, 101.60it/s]
 89%|████████▉ | 72/81 [00:00<00:00, 111.26it/s]
100%|██████████| 81/81 [00:00<00:00, 110.80it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 417.26it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 130.70it/s]
 35%|███▍      | 28/81 [00:00<00:00, 134.45it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 132.67it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 131.32it/s]
 86%|████████▋ | 70/81 [00:00<00:00, 129.81it/s]
1

[2m[36m(func pid=24608)[0m Epoch 00106: reducing learning rate of group 0 to 6.7850e-05.


 36%|███▌      | 29/81 [00:00<00:00, 139.17it/s]
 53%|█████▎    | 43/81 [00:00<00:00, 123.49it/s]
 70%|███████   | 57/81 [00:00<00:00, 127.26it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 359.51it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 125.67it/s]
 35%|███▍      | 28/81 [00:00<00:00, 131.35it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 121.67it/s]
 68%|██████▊   | 55/81 [00:00<00:00, 115.28it/s]
100%|██████████| 81/81 [00:00<00:00, 125.27it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 189.90it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 40%|███▉      | 32/81 [00:00<00:00, 154.08it/s]
 59%|█████▉    | 48/81 [00:00<00:00, 154.73it/s]
 79%|███████▉  | 64/81 [00:00<00:00, 155.94it/s]
100%|██████████| 81/81 [00:00<00:00, 153.96it/s]
100%|██████████| 24/24 [00:00<00:00, 499.33it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 149.93it/s]
 38%|███▊      | 31/8

[2m[36m(func pid=24608)[0m Epoch 00112: reducing learning rate of group 0 to 3.3925e-05.


 37%|███▋      | 30/81 [00:00<00:00, 141.91it/s]
 56%|█████▌    | 45/81 [00:00<00:00, 125.60it/s]
 73%|███████▎  | 59/81 [00:00<00:00, 128.60it/s]
100%|██████████| 81/81 [00:00<00:00, 137.46it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 16%|█▌        | 13/81 [00:00<00:00, 129.78it/s]
 32%|███▏      | 26/81 [00:00<00:00, 123.24it/s]
 51%|█████     | 41/81 [00:00<00:00, 129.54it/s]
 67%|██████▋   | 54/81 [00:00<00:00, 122.42it/s]
 84%|████████▍ | 68/81 [00:00<00:00, 126.00it/s]
100%|██████████| 81/81 [00:00<00:00, 121.13it/s]
100%|██████████| 24/24 [00:00<00:00, 436.02it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 37%|███▋      | 30/81 [00:00<00:00, 137.79it/s]
 54%|█████▍    | 44/81 [00:00<00:00, 135.16it/s]
 73%|███████▎  | 59/81 [00:00<00:00, 140.07it/s]
100%|██████████| 81/81 [00:00<00:00, 139.05it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 487.56it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 149.39it/s]
 38%|███▊  

[2m[36m(func pid=24608)[0m Epoch 00118: reducing learning rate of group 0 to 1.6963e-05.


 16%|█▌        | 13/81 [00:00<00:00, 126.21it/s]
 32%|███▏      | 26/81 [00:00<00:00, 85.06it/s] 
 49%|████▉     | 40/81 [00:00<00:00, 101.61it/s]
 63%|██████▎   | 51/81 [00:00<00:00, 101.12it/s]
 81%|████████▏ | 66/81 [00:00<00:00, 114.93it/s]
100%|██████████| 81/81 [00:00<00:00, 114.14it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 410.09it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 19%|█▊        | 15/81 [00:00<00:00, 143.01it/s]
 37%|███▋      | 30/81 [00:00<00:00, 130.29it/s]
 54%|█████▍    | 44/81 [00:00<00:00, 131.97it/s]
 73%|███████▎  | 59/81 [00:00<00:00, 135.81it/s]
100%|██████████| 24/24 [00:00<00:00, 429.49it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 134.84it/s]
 35%|███▍      | 28/81 [00:00<00:00, 126.17it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 131.40it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 118.95it/s]
 86%|████████▋ | 70/81 [00:00<00:00, 123.18it/s]
100%|██████████| 81/81 [00:00<00:00, 127.72it/s]
1

[2m[36m(func pid=24608)[0m Epoch 00136: reducing learning rate of group 0 to 2.1203e-06.


 40%|███▉      | 32/81 [00:00<00:00, 152.50it/s]
 59%|█████▉    | 48/81 [00:00<00:00, 149.73it/s]
 78%|███████▊  | 63/81 [00:00<00:00, 140.21it/s]
100%|██████████| 24/24 [00:00<00:00, 414.41it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 15%|█▍        | 12/81 [00:00<00:00, 118.50it/s]
 30%|██▉       | 24/81 [00:00<00:00, 102.68it/s]
 46%|████▌     | 37/81 [00:00<00:00, 111.82it/s]
 60%|██████    | 49/81 [00:00<00:00, 107.19it/s]
 77%|███████▋  | 62/81 [00:00<00:00, 112.61it/s]
 91%|█████████▏| 74/81 [00:00<00:00, 110.06it/s]
100%|██████████| 81/81 [00:00<00:00, 111.87it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 430.28it/s]
 17%|█▋        | 14/81 [00:00<00:00, 132.29it/s]
 35%|███▍      | 28/81 [00:00<00:00, 130.58it/s]
 52%|█████▏    | 42/81 [00:00<00:00, 128.89it/s]
 69%|██████▉   | 56/81 [00:00<00:00, 132.62it/s]
100%|██████████| 81/81 [00:00<00:00, 132.08it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 138.92it/s]
 

[2m[36m(func pid=24608)[0m Epoch 00142: reducing learning rate of group 0 to 1.0602e-06.


 16%|█▌        | 13/81 [00:00<00:00, 126.28it/s]
 32%|███▏      | 26/81 [00:00<00:00, 125.69it/s]
 48%|████▊     | 39/81 [00:00<00:00, 125.13it/s]
 65%|██████▌   | 53/81 [00:00<00:00, 130.06it/s]
100%|██████████| 24/24 [00:00<00:00, 420.53it/s]
 14%|█▎        | 11/81 [00:00<00:00, 107.06it/s]
 32%|███▏      | 26/81 [00:00<00:00, 127.43it/s]
 48%|████▊     | 39/81 [00:00<00:00, 114.39it/s]
 63%|██████▎   | 51/81 [00:00<00:00, 115.18it/s]
 78%|███████▊  | 63/81 [00:00<00:00, 115.28it/s]
100%|██████████| 81/81 [00:00<00:00, 121.46it/s]
100%|██████████| 24/24 [00:00<00:00, 494.30it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 138.36it/s]
 37%|███▋      | 30/81 [00:00<00:00, 146.99it/s]
 57%|█████▋    | 46/81 [00:00<00:00, 148.80it/s]
 75%|███████▌  | 61/81 [00:00<00:00, 148.72it/s]
100%|██████████| 24/24 [00:00<00:00, 340.69it/s]
  0%|          | 0/81 [00:00<?, ?it/s]
 15%|█▍        | 12/81 [00:00<00:00, 118.88it/s]
 32%|███▏      | 26/81 [00:00<00:00, 128

[2m[36m(func pid=24608)[0m Epoch 00148: reducing learning rate of group 0 to 5.3008e-07.


 40%|███▉      | 32/81 [00:00<00:00, 153.00it/s]
 59%|█████▉    | 48/81 [00:00<00:00, 152.75it/s]
 79%|███████▉  | 64/81 [00:00<00:00, 148.36it/s]
100%|██████████| 81/81 [00:00<00:00, 150.26it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
 17%|█▋        | 14/81 [00:00<00:00, 129.44it/s]
 33%|███▎      | 27/81 [00:00<00:00, 128.50it/s]
 49%|████▉     | 40/81 [00:00<00:00, 92.34it/s] 
 80%|████████  | 65/81 [00:00<00:00, 108.04it/s]
 96%|█████████▋| 78/81 [00:00<00:00, 113.58it/s]
100%|██████████| 81/81 [00:00<00:00, 110.16it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:01, 27.21it/s]
 44%|████▍     | 18/41 [00:00<00:00, 46.33it/s]
100%|██████████| 12/12 [00:00<00:00, 185.33it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 84.21it/s]
 44%|████▍     | 18/41 [00:00<00:00, 80.46it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 80.86it/s]
 88%|████████▊ | 36/41 [00:00<00:00, 81.29it/s]
100%|██████████| 41

[2m[36m(func pid=17800)[0m Epoch 00051: reducing learning rate of group 0 to 1.6860e-03.


 24%|██▍       | 10/41 [00:00<00:00, 93.56it/s]
 49%|████▉     | 20/41 [00:00<00:00, 92.72it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 93.33it/s]
100%|██████████| 41/41 [00:00<00:00, 92.80it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 189.89it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 95.68it/s]
 49%|████▉     | 20/41 [00:00<00:00, 93.48it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 92.21it/s]
100%|██████████| 41/41 [00:00<00:00, 93.33it/s]
100%|██████████| 12/12 [00:00<00:00, 193.12it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 75.54it/s]
 41%|████▏     | 17/41 [00:00<00:00, 81.88it/s]
100%|██████████| 41/41 [00:00<00:00, 86.47it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 188.16it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 86.59it/s]
 44%|████▍     | 18/41 [00:00<00:00, 84.12it/s]
 66%|██████▌   | 27/41 [00:00<00:00,

[2m[36m(func pid=17800)[0m Epoch 00057: reducing learning rate of group 0 to 8.4299e-04.


 22%|██▏       | 9/41 [00:00<00:00, 49.71it/s]
 44%|████▍     | 18/41 [00:00<00:00, 67.21it/s]
100%|██████████| 12/12 [00:00<00:00, 181.95it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 89.08it/s]
 44%|████▍     | 18/41 [00:00<00:00, 87.93it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 85.86it/s]
100%|██████████| 41/41 [00:00<00:00, 87.59it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 200.16it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 84.23it/s]
 44%|████▍     | 18/41 [00:00<00:00, 82.87it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 80.45it/s]
100%|██████████| 41/41 [00:00<00:00, 82.60it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 149.66it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 84.32it/s]
 44%|████▍     | 18/41 [00:00<00:00, 77.02it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 78.77it/s]
  0%|          | 0/41 [00:00<?, ?it/s]

[2m[36m(func pid=17800)[0m Epoch 00072: reducing learning rate of group 0 to 4.2149e-04.


 17%|█▋        | 7/41 [00:00<00:00, 35.37it/s]
 56%|█████▌    | 23/41 [00:00<00:00, 61.57it/s]
 76%|███████▌  | 31/41 [00:00<00:00, 65.57it/s]
100%|██████████| 41/41 [00:00<00:00, 61.47it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 159.76it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 87.06it/s]
 44%|████▍     | 18/41 [00:00<00:00, 83.13it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 82.55it/s]
100%|██████████| 41/41 [00:00<00:00, 83.30it/s]
100%|██████████| 12/12 [00:00<00:00, 170.78it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 82.74it/s]
 44%|████▍     | 18/41 [00:00<00:00, 85.74it/s]
100%|██████████| 12/12 [00:00<00:00, 179.39it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 82.06it/s]
 44%|████▍     | 18/41 [00:00<00:00, 85.51it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 82.31it/s]
 88%|████████▊ | 36/41 [00:00<00:00, 83.65it/s]
100%|██████████| 41/41 [00:00

[2m[36m(func pid=17800)[0m Epoch 00137: reducing learning rate of group 0 to 5.2687e-05.


 44%|████▍     | 18/41 [00:00<00:00, 87.43it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 89.95it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 71.67it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 79.39it/s]
 39%|███▉      | 16/41 [00:00<00:00, 79.25it/s]
 61%|██████    | 25/41 [00:00<00:00, 80.53it/s]
 83%|████████▎ | 34/41 [00:00<00:00, 82.34it/s]
100%|██████████| 41/41 [00:00<00:00, 84.02it/s]
100%|██████████| 12/12 [00:00<00:00, 200.93it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 90.11it/s]
 49%|████▉     | 20/41 [00:00<00:00, 90.62it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 91.42it/s]
100%|██████████| 41/41 [00:00<00:00, 92.73it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 191.10it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 85.25it/s]
 44%|████▍     | 18/41 [00:00<00:00, 86.29it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 

  0%|          | 0/41 [00:00<?, ?it/s]
  2%|▏         | 1/41 [00:00<00:11,  3.50it/s]
 24%|██▍       | 10/41 [00:00<00:00, 32.22it/s]
 46%|████▋     | 19/41 [00:00<00:00, 50.65it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 61.64it/s]
100%|██████████| 41/41 [00:00<00:00, 56.40it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 162.28it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 85.99it/s]
 44%|████▍     | 18/41 [00:00<00:00, 86.73it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 84.49it/s]
100%|██████████| 41/41 [00:00<00:00, 88.23it/s]
100%|██████████| 12/12 [00:00<00:00, 214.10it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 12%|█▏        | 5/41 [00:00<00:00, 38.60it/s]
 56%|█████▌    | 23/41 [00:00<00:00, 75.26it/s]
 80%|████████  | 33/41 [00:00<00:00, 82.10it/s]
100%|██████████| 41/41 [00:00<00:00, 78.03it/s]
100%|██████████| 12/12 [00:00<00:00, 218.72it/s]
 27%|██▋       | 11/41 [00:00<00:00, 100.77it/s]
 54%|█████▎    | 22/41 [00:

[2m[36m(func pid=5692)[0m Epoch 00042: reducing learning rate of group 0 to 4.8084e-03.


 22%|██▏       | 9/41 [00:00<00:00, 84.87it/s]
 44%|████▍     | 18/41 [00:00<00:00, 58.78it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 72.83it/s]
100%|██████████| 41/41 [00:00<00:00, 78.26it/s]
100%|██████████| 12/12 [00:00<00:00, 222.00it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 94.25it/s]
 49%|████▉     | 20/41 [00:00<00:00, 94.79it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 95.40it/s]
100%|██████████| 41/41 [00:00<00:00, 96.79it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 226.83it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 98.93it/s]
 51%|█████     | 21/41 [00:00<00:00, 100.75it/s]
100%|██████████| 41/41 [00:00<00:00, 100.95it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 173.57it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 86.03it/s]
 44%|████▍     | 18/41 [00:00<00:00, 83.56it/s]
 68%|██████▊   | 28/41 [00:00<00:0

[2m[36m(func pid=5692)[0m Epoch 00057: reducing learning rate of group 0 to 2.4042e-03.


 51%|█████     | 21/41 [00:00<00:00, 98.48it/s]
 76%|███████▌  | 31/41 [00:00<00:00, 90.39it/s]
100%|██████████| 41/41 [00:00<00:00, 94.23it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
 83%|████████▎ | 10/12 [00:00<00:00, 79.71it/s]
100%|██████████| 12/12 [00:00<00:00, 90.47it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 92.65it/s]
 49%|████▉     | 20/41 [00:00<00:00, 89.60it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 92.88it/s]
100%|██████████| 41/41 [00:00<00:00, 93.09it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 199.50it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 99.37it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 100.35it/s]
 80%|████████  | 33/41 [00:00<00:00, 97.22it/s] 
100%|██████████| 41/41 [00:00<00:00, 97.67it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 210.37it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 101.0

[2m[36m(func pid=5692)[0m Epoch 00069: reducing learning rate of group 0 to 1.2021e-03.


 22%|██▏       | 9/41 [00:00<00:00, 89.16it/s]
 44%|████▍     | 18/41 [00:00<00:00, 82.94it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 84.40it/s]
100%|██████████| 41/41 [00:00<00:00, 79.76it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 176.83it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 89.08it/s]
 44%|████▍     | 18/41 [00:00<00:00, 87.68it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 88.65it/s]
100%|██████████| 41/41 [00:00<00:00, 87.96it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 76.77it/s]
 41%|████▏     | 17/41 [00:00<00:00, 80.76it/s]
 63%|██████▎   | 26/41 [00:00<00:00, 79.51it/s]
 85%|████████▌ | 35/41 [00:00<00:00, 82.55it/s]
100%|██████████| 41/41 [00:00<00:00, 82.81it/s]
100%|██████████| 12/12 [00:00<00:00, 165.76it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 88.20it/s]
 44%|████▍     | 18/41 [00:00<00:00, 86.66it/s]
 66%|██████▌   | 27/41 [00:00<

[2m[36m(func pid=5692)[0m Epoch 00075: reducing learning rate of group 0 to 6.0105e-04.


 46%|████▋     | 19/41 [00:00<00:00, 89.31it/s]
 71%|███████   | 29/41 [00:00<00:00, 90.45it/s]
100%|██████████| 12/12 [00:00<00:00, 190.59it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 70.64it/s]
 61%|██████    | 25/41 [00:00<00:00, 77.53it/s]
 83%|████████▎ | 34/41 [00:00<00:00, 81.16it/s]
100%|██████████| 41/41 [00:00<00:00, 79.87it/s]
100%|██████████| 12/12 [00:00<00:00, 220.10it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 90.74it/s]
 49%|████▉     | 20/41 [00:00<00:00, 89.96it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 92.77it/s]
100%|██████████| 41/41 [00:00<00:00, 92.86it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 84.04it/s]
 46%|████▋     | 19/41 [00:00<00:00, 89.62it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 88.95it/s]
 93%|█████████▎| 38/41 [00:00<00:00, 89.76it/s]
100%|██████████| 41/41 [00:00<00:00, 88.16it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:0

[2m[36m(func pid=5692)[0m Epoch 00081: reducing learning rate of group 0 to 3.0053e-04.


 27%|██▋       | 11/41 [00:00<00:00, 102.09it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 94.91it/s] 
 78%|███████▊  | 32/41 [00:00<00:00, 95.74it/s]
100%|██████████| 41/41 [00:00<00:00, 97.92it/s]
100%|██████████| 12/12 [00:00<00:00, 230.19it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 97.29it/s]
 76%|███████▌  | 31/41 [00:00<00:00, 97.89it/s]
100%|██████████| 41/41 [00:00<00:00, 99.10it/s]
100%|██████████| 12/12 [00:00<00:00, 216.52it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
  7%|▋         | 3/41 [00:00<00:01, 27.69it/s]
 32%|███▏      | 13/41 [00:00<00:00, 68.72it/s]
 56%|█████▌    | 23/41 [00:00<00:00, 82.38it/s]
 80%|████████  | 33/41 [00:00<00:00, 88.90it/s]
100%|██████████| 12/12 [00:00<00:00, 183.86it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 86.53it/s]
 46%|████▋     | 19/41 [00:00<00:00, 89.05it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 85.55it/s]
 93%|█████████▎| 38/41 [00:00<00:00, 87.44it/s]
100%|██████████|

[2m[36m(func pid=5692)[0m Epoch 00087: reducing learning rate of group 0 to 1.5026e-04.


 24%|██▍       | 10/41 [00:00<00:00, 98.53it/s]
 49%|████▉     | 20/41 [00:00<00:00, 90.08it/s]
 98%|█████████▊| 40/41 [00:00<00:00, 94.13it/s]
100%|██████████| 41/41 [00:00<00:00, 93.85it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 188.43it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 15%|█▍        | 6/41 [00:00<00:00, 41.40it/s]
 39%|███▉      | 16/41 [00:00<00:00, 69.76it/s]
 63%|██████▎   | 26/41 [00:00<00:00, 79.65it/s]
100%|██████████| 41/41 [00:00<00:00, 81.69it/s]
100%|██████████| 12/12 [00:00<00:00, 229.15it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 99.90it/s]
 78%|███████▊  | 32/41 [00:00<00:00, 101.53it/s]
100%|██████████| 41/41 [00:00<00:00, 100.45it/s]
100%|██████████| 12/12 [00:00<00:00, 216.11it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 99.57it/s]
 51%|█████     | 21/41 [00:00<00:00, 101.77it/s]
100%|██████████| 41/41 [00:00<00:00, 99.52it/s] 
  0%|          | 0/12 

[2m[36m(func pid=5692)[0m Epoch 00093: reducing learning rate of group 0 to 7.5131e-05.


 24%|██▍       | 10/41 [00:00<00:00, 98.01it/s]
 49%|████▉     | 20/41 [00:00<00:00, 97.63it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 190.10it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 72.19it/s]
 44%|████▍     | 18/41 [00:00<00:00, 84.02it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 80.66it/s]
100%|██████████| 41/41 [00:00<00:00, 83.02it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 215.53it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 95.15it/s]
 49%|████▉     | 20/41 [00:00<00:00, 95.26it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 94.79it/s]
100%|██████████| 41/41 [00:00<00:00, 95.11it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 223.44it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 100.20it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 97.99it/s] 
 78%|███████▊  | 32/41 [00:00<00:00, 97.58

[2m[36m(func pid=5692)[0m Epoch 00099: reducing learning rate of group 0 to 3.7566e-05.


 49%|████▉     | 20/41 [00:00<00:00, 91.97it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 92.17it/s]
100%|██████████| 12/12 [00:00<00:00, 208.89it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 92.63it/s]
 49%|████▉     | 20/41 [00:00<00:00, 85.00it/s]
 95%|█████████▌| 39/41 [00:00<00:00, 86.75it/s]
100%|██████████| 41/41 [00:00<00:00, 87.03it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 212.15it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 99.33it/s]
 51%|█████     | 21/41 [00:00<00:00, 98.64it/s]
 76%|███████▌  | 31/41 [00:00<00:00, 99.22it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 179.23it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 82.14it/s]
 46%|████▋     | 19/41 [00:00<00:00, 89.86it/s]
 71%|███████   | 29/41 [00:00<00:00, 86.71it/s]
100%|██████████| 41/41 [00:00<00:00, 86.83it/s]
  0%|          | 0/12 [00:00<?, ?it

[2m[36m(func pid=5692)[0m Epoch 00105: reducing learning rate of group 0 to 1.8783e-05.


 24%|██▍       | 10/41 [00:00<00:00, 99.05it/s]
 51%|█████     | 21/41 [00:00<00:00, 100.33it/s]
100%|██████████| 41/41 [00:00<00:00, 99.87it/s] 
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 230.38it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 97.27it/s]
 49%|████▉     | 20/41 [00:00<00:00, 98.23it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 96.83it/s]
 98%|█████████▊| 40/41 [00:00<00:00, 95.50it/s]
100%|██████████| 41/41 [00:00<00:00, 96.63it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 203.50it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 99.06it/s]
 49%|████▉     | 20/41 [00:00<00:00, 99.04it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 179.95it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 84.90it/s]
 46%|████▋     | 19/41 [00:00<00:00, 89.92it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 89.86

[2m[36m(func pid=5692)[0m Epoch 00111: reducing learning rate of group 0 to 9.3914e-06.


 24%|██▍       | 10/41 [00:00<00:00, 96.59it/s]
 49%|████▉     | 20/41 [00:00<00:00, 92.86it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 88.63it/s]
100%|██████████| 41/41 [00:00<00:00, 92.73it/s]
100%|██████████| 12/12 [00:00<00:00, 223.34it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 95.34it/s]
 51%|█████     | 21/41 [00:00<00:00, 98.16it/s]
100%|██████████| 41/41 [00:00<00:00, 100.12it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 86.83it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 95.46it/s]
 51%|█████     | 21/41 [00:00<00:00, 98.64it/s]
 78%|███████▊  | 32/41 [00:00<00:00, 100.07it/s]
100%|██████████| 41/41 [00:00<00:00, 99.97it/s] 
100%|██████████| 12/12 [00:00<00:00, 218.46it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 95.08it/s]
 49%|████▉     | 20/41 [00:00<00:00, 94.77it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 93.65it/s]
100%|██████████| 41/41 

[2m[36m(func pid=5692)[0m Epoch 00123: reducing learning rate of group 0 to 2.3479e-06.


 22%|██▏       | 9/41 [00:00<00:00, 86.44it/s]
 46%|████▋     | 19/41 [00:00<00:00, 89.50it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 86.31it/s]
100%|██████████| 41/41 [00:00<00:00, 89.32it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 215.79it/s]
 24%|██▍       | 10/41 [00:00<00:00, 99.12it/s]
 49%|████▉     | 20/41 [00:00<00:00, 94.04it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 93.29it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 157.89it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 20%|█▉        | 8/41 [00:00<00:00, 78.50it/s]
 41%|████▏     | 17/41 [00:00<00:00, 84.60it/s]
 63%|██████▎   | 26/41 [00:00<00:00, 84.21it/s]
 85%|████████▌ | 35/41 [00:00<00:00, 86.44it/s]
100%|██████████| 41/41 [00:00<00:00, 86.92it/s]
100%|██████████| 12/12 [00:00<00:00, 212.49it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 97.77it/s]
 49%|████▉     | 20/41 [00:00<00:00, 98.69it/s]
 73%|███████▎  | 30/41 [00:

[2m[36m(func pid=5692)[0m Epoch 00129: reducing learning rate of group 0 to 1.1739e-06.


 27%|██▋       | 11/41 [00:00<00:00, 100.02it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 89.92it/s] 
100%|██████████| 41/41 [00:00<00:00, 92.70it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 193.28it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 93.41it/s]
 49%|████▉     | 20/41 [00:00<00:00, 92.90it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 95.21it/s]
100%|██████████| 12/12 [00:00<00:00, 200.16it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 82.52it/s]
 46%|████▋     | 19/41 [00:00<00:00, 88.25it/s]
 68%|██████▊   | 28/41 [00:00<00:00, 84.89it/s]
100%|██████████| 41/41 [00:00<00:00, 86.90it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 208.87it/s]
[2m[36m(func pid=5692)[0m 
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 96.90it/s]
 49%|████▉     | 20/41 [00:00<00:00, 98.18it/s]
100%|██████████| 41/41 [00:00<00:00, 98.50it/s]
  0

[2m[36m(func pid=5692)[0m Epoch 00135: reducing learning rate of group 0 to 5.8696e-07.


  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 97.87it/s]
 49%|████▉     | 20/41 [00:00<00:00, 91.11it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 89.61it/s]
 98%|█████████▊| 40/41 [00:00<00:00, 90.71it/s]
100%|██████████| 41/41 [00:00<00:00, 91.48it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 218.56it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 97.75it/s]
 49%|████▉     | 20/41 [00:00<00:00, 94.74it/s]
 73%|███████▎  | 30/41 [00:00<00:00, 94.38it/s]
100%|██████████| 41/41 [00:00<00:00, 94.90it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 214.55it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 100.45it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 101.82it/s]
 80%|████████  | 33/41 [00:00<00:00, 101.43it/s]
100%|██████████| 41/41 [00:00<00:00, 100.61it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 225

[2m[36m(func pid=5692)[0m Epoch 00141: reducing learning rate of group 0 to 2.9348e-07.


 24%|██▍       | 10/41 [00:00<00:00, 92.92it/s]
 49%|████▉     | 20/41 [00:00<00:00, 87.16it/s]
 95%|█████████▌| 39/41 [00:00<00:00, 85.87it/s]
100%|██████████| 41/41 [00:00<00:00, 87.01it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 222.88it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 27%|██▋       | 11/41 [00:00<00:00, 102.46it/s]
 54%|█████▎    | 22/41 [00:00<00:00, 99.21it/s] 
 80%|████████  | 33/41 [00:00<00:00, 99.39it/s]
100%|██████████| 41/41 [00:00<00:00, 99.14it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
 33%|███▎      | 4/12 [00:00<00:00, 37.88it/s]
100%|██████████| 12/12 [00:00<00:00, 82.73it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 24%|██▍       | 10/41 [00:00<00:00, 94.35it/s]
 51%|█████     | 21/41 [00:00<00:00, 98.18it/s]
 76%|███████▌  | 31/41 [00:00<00:00, 98.53it/s]
100%|██████████| 41/41 [00:00<00:00, 98.47it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 200.70it/s]
  0%|          | 0/41 [00:00<?, ?i

[2m[36m(func pid=5692)[0m Epoch 00147: reducing learning rate of group 0 to 1.4674e-07.


 24%|██▍       | 10/41 [00:00<00:00, 89.24it/s]
 46%|████▋     | 19/41 [00:00<00:00, 81.39it/s]
 71%|███████   | 29/41 [00:00<00:00, 87.69it/s]
100%|██████████| 41/41 [00:00<00:00, 86.66it/s]
100%|██████████| 12/12 [00:00<00:00, 235.24it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 10%|▉         | 4/41 [00:00<00:01, 33.39it/s]
 34%|███▍      | 14/41 [00:00<00:00, 68.82it/s]
 61%|██████    | 25/41 [00:00<00:00, 83.86it/s]
 85%|████████▌ | 35/41 [00:00<00:00, 89.57it/s]
100%|██████████| 41/41 [00:00<00:00, 84.09it/s]
  0%|          | 0/12 [00:00<?, ?it/s]
100%|██████████| 12/12 [00:00<00:00, 176.20it/s]
  0%|          | 0/41 [00:00<?, ?it/s]
 22%|██▏       | 9/41 [00:00<00:00, 81.21it/s]
 44%|████▍     | 18/41 [00:00<00:00, 83.72it/s]
 66%|██████▌   | 27/41 [00:00<00:00, 85.72it/s]
100%|██████████| 41/41 [00:00<00:00, 85.95it/s]
100%|██████████| 12/12 [00:00<00:00, 210.12it/s]
100%|██████████| 6/6 [00:00<00:00, 171.22it/s]
[2m[36m(func pid=21400)[0m   self.obj[key] = value
  0%|        

[2m[36m(func pid=21400)[0m Epoch 00010: reducing learning rate of group 0 to 2.3223e-04.


 35%|███▍      | 29/83 [00:00<00:00, 141.37it/s]
 53%|█████▎    | 44/83 [00:00<00:00, 142.25it/s]
 71%|███████   | 59/83 [00:00<00:00, 139.35it/s]
100%|██████████| 83/83 [00:00<00:00, 139.34it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 289.16it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 146.97it/s]
 37%|███▋      | 31/83 [00:00<00:00, 151.87it/s]
 57%|█████▋    | 47/83 [00:00<00:00, 150.84it/s]
 76%|███████▌  | 63/83 [00:00<00:00, 149.11it/s]
100%|██████████| 83/83 [00:00<00:00, 148.19it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 295.05it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 139.77it/s]
 34%|███▎      | 28/83 [00:00<00:00, 138.82it/s]
 52%|█████▏    | 43/83 [00:00<00:00, 143.25it/s]
 71%|███████   | 59/83 [00:00<00:00, 148.99it/s]
 90%|█████████ | 75/83 [00:00<00:00, 150.76it/s]
100%|██████████| 83/83 [00:00<00:00, 147.96it/s]
  0%|      

[2m[36m(func pid=21400)[0m Epoch 00018: reducing learning rate of group 0 to 1.1611e-04.


 34%|███▎      | 28/83 [00:00<00:00, 132.53it/s]
 52%|█████▏    | 43/83 [00:00<00:00, 137.28it/s]
100%|██████████| 24/24 [00:00<00:00, 266.11it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 16%|█▌        | 13/83 [00:00<00:00, 124.06it/s]
 31%|███▏      | 26/83 [00:00<00:00, 115.72it/s]
 46%|████▌     | 38/83 [00:00<00:00, 112.96it/s]
 61%|██████▏   | 51/83 [00:00<00:00, 115.75it/s]
 76%|███████▌  | 63/83 [00:00<00:00, 107.96it/s]
 95%|█████████▌| 79/83 [00:00<00:00, 121.85it/s]
100%|██████████| 83/83 [00:00<00:00, 118.92it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 326.04it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 145.36it/s]
 36%|███▌      | 30/83 [00:00<00:00, 143.30it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 146.18it/s]
100%|██████████| 24/24 [00:00<00:00, 314.84it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 14%|█▍        | 12/83 [00:00<00:00, 116.29it/s]
 33%|███▎      | 27/83 [00:00<00:00, 132.69it/s]
 49%|████▉ 

[2m[36m(func pid=21400)[0m Epoch 00024: reducing learning rate of group 0 to 5.8057e-05.


  0%|          | 0/83 [00:00<?, ?it/s]
 36%|███▌      | 30/83 [00:00<00:00, 146.02it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 147.52it/s]
 72%|███████▏  | 60/83 [00:00<00:00, 145.18it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 235.31it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 14%|█▍        | 12/83 [00:00<00:00, 115.16it/s]
 29%|██▉       | 24/83 [00:00<00:00, 114.10it/s]
 43%|████▎     | 36/83 [00:00<00:00, 114.56it/s]
 58%|█████▊    | 48/83 [00:00<00:00, 115.39it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 119.11it/s]
 88%|████████▊ | 73/83 [00:00<00:00, 115.26it/s]
100%|██████████| 83/83 [00:00<00:00, 118.31it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 323.22it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 141.15it/s]
 36%|███▌      | 30/83 [00:00<00:00, 140.84it/s]
 55%|█████▌    | 46/83 [00:00<00:00, 145.92it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 142.17it/s]
100%|██████████| 24/2

[2m[36m(func pid=21400)[0m Epoch 00031: reducing learning rate of group 0 to 2.9029e-05.


 33%|███▎      | 27/83 [00:00<00:00, 129.19it/s]
 48%|████▊     | 40/83 [00:00<00:00, 124.21it/s]
 64%|██████▍   | 53/83 [00:00<00:00, 124.96it/s]
100%|██████████| 83/83 [00:00<00:00, 133.00it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 317.38it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 133.09it/s]
 35%|███▍      | 29/83 [00:00<00:00, 141.28it/s]
 53%|█████▎    | 44/83 [00:00<00:00, 143.91it/s]
 89%|████████▉ | 74/83 [00:00<00:00, 144.12it/s]
100%|██████████| 24/24 [00:00<00:00, 281.48it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 34%|███▎      | 28/83 [00:00<00:00, 134.44it/s]
 51%|█████     | 42/83 [00:00<00:00, 124.24it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 125.67it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 117.41it/s]
100%|██████████| 83/83 [00:00<00:00, 123.54it/s]
 21%|██        | 5/24 [00:00<00:00, 49.85it/s]
100%|██████████| 24/24 [00:00<00:00, 150.13it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 19%|█▉      

[2m[36m(func pid=21400)[0m Epoch 00037: reducing learning rate of group 0 to 1.4514e-05.


  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 136.13it/s]
 34%|███▎      | 28/83 [00:00<00:00, 128.03it/s]
 51%|█████     | 42/83 [00:00<00:00, 130.86it/s]
 67%|██████▋   | 56/83 [00:00<00:00, 123.92it/s]
 86%|████████▌ | 71/83 [00:00<00:00, 130.77it/s]
100%|██████████| 83/83 [00:00<00:00, 132.49it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 303.57it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 149.94it/s]
 36%|███▌      | 30/83 [00:00<00:00, 146.01it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 145.61it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 149.50it/s]
100%|██████████| 24/24 [00:00<00:00, 303.90it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
  5%|▍         | 4/83 [00:00<00:02, 30.74it/s]
 22%|██▏       | 18/83 [00:00<00:00, 87.58it/s]
 34%|███▎      | 28/83 [00:00<00:00, 90.91it/s]
 51%|█████     | 42/83 [00:00<00:00, 106.47it/s]
 64%|██████▍   | 53/83 [00:00<00:00, 100.76it/s]
 81%|████████  

[2m[36m(func pid=21400)[0m Epoch 00043: reducing learning rate of group 0 to 7.2571e-06.


 18%|█▊        | 15/83 [00:00<00:00, 142.40it/s]
 36%|███▌      | 30/83 [00:00<00:00, 124.79it/s]
 52%|█████▏    | 43/83 [00:00<00:00, 126.33it/s]
 83%|████████▎ | 69/83 [00:00<00:00, 120.09it/s]
100%|██████████| 83/83 [00:00<00:00, 126.67it/s]
100%|██████████| 24/24 [00:00<00:00, 319.47it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 144.13it/s]
 36%|███▌      | 30/83 [00:00<00:00, 144.21it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 147.80it/s]
 93%|█████████▎| 77/83 [00:00<00:00, 150.43it/s]
100%|██████████| 83/83 [00:00<00:00, 148.50it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 316.27it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 12%|█▏        | 10/83 [00:00<00:00, 96.91it/s]
 29%|██▉       | 24/83 [00:00<00:00, 117.19it/s]
 43%|████▎     | 36/83 [00:00<00:00, 114.76it/s]
 58%|█████▊    | 48/83 [00:00<00:00, 113.75it/s]
 75%|███████▍  | 62/83 [00:00<00:00, 122.44it/s]
 92%|█████████▏| 76/83 [00:00<00:00, 128.21it/s]
10

[2m[36m(func pid=21400)[0m Epoch 00049: reducing learning rate of group 0 to 3.6286e-06.


 14%|█▍        | 12/83 [00:00<00:00, 114.33it/s]
 29%|██▉       | 24/83 [00:00<00:00, 113.68it/s]
 46%|████▌     | 38/83 [00:00<00:00, 118.79it/s]
 60%|██████    | 50/83 [00:00<00:00, 112.25it/s]
 76%|███████▌  | 63/83 [00:00<00:00, 115.90it/s]
 93%|█████████▎| 77/83 [00:00<00:00, 121.68it/s]
100%|██████████| 83/83 [00:00<00:00, 105.40it/s]
100%|██████████| 24/24 [00:00<00:00, 296.20it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 16%|█▌        | 13/83 [00:00<00:00, 129.43it/s]
 33%|███▎      | 27/83 [00:00<00:00, 133.69it/s]
 49%|████▉     | 41/83 [00:00<00:00, 134.62it/s]
 67%|██████▋   | 56/83 [00:00<00:00, 137.48it/s]
 84%|████████▍ | 70/83 [00:00<00:00, 135.82it/s]
100%|██████████| 24/24 [00:00<00:00, 237.75it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 14%|█▍        | 12/83 [00:00<00:00, 111.15it/s]
 29%|██▉       | 24/83 [00:00<00:00, 115.94it/s]
 58%|█████▊    | 48/83 [00:00<00:00, 109.36it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 113.79it/s]
 88%|████████▊ | 73/83 [00:00<00:00, 107

[2m[36m(func pid=21400)[0m Epoch 00055: reducing learning rate of group 0 to 1.8143e-06.


 17%|█▋        | 14/83 [00:00<00:00, 138.35it/s]
 34%|███▎      | 28/83 [00:00<00:00, 85.05it/s] 
 51%|█████     | 42/83 [00:00<00:00, 100.50it/s]
 70%|██████▉   | 58/83 [00:00<00:00, 116.99it/s]
100%|██████████| 83/83 [00:00<00:00, 118.21it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 287.04it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 136.04it/s]
 35%|███▍      | 29/83 [00:00<00:00, 139.15it/s]
 53%|█████▎    | 44/83 [00:00<00:00, 140.12it/s]
 89%|████████▉ | 74/83 [00:00<00:00, 140.65it/s]
100%|██████████| 24/24 [00:00<00:00, 243.99it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 31%|███▏      | 26/83 [00:00<00:00, 124.08it/s]
 48%|████▊     | 40/83 [00:00<00:00, 127.78it/s]
 64%|██████▍   | 53/83 [00:00<00:00, 120.06it/s]
 80%|███████▉  | 66/83 [00:00<00:00, 117.35it/s]
100%|██████████| 83/83 [00:00<00:00, 124.10it/s]
100%|██████████| 24/24 [00:00<00:00, 304.67it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊    

[2m[36m(func pid=21400)[0m Epoch 00061: reducing learning rate of group 0 to 9.0714e-07.


 17%|█▋        | 14/83 [00:00<00:00, 129.71it/s]
 33%|███▎      | 27/83 [00:00<00:00, 113.51it/s]
 51%|█████     | 42/83 [00:00<00:00, 125.22it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 121.53it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 122.20it/s]
100%|██████████| 83/83 [00:00<00:00, 126.85it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 311.39it/s]
 18%|█▊        | 15/83 [00:00<00:00, 145.15it/s]
 36%|███▌      | 30/83 [00:00<00:00, 139.90it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 140.85it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 303.11it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 143.25it/s]
 36%|███▌      | 30/83 [00:00<00:00, 133.11it/s]
 53%|█████▎    | 44/83 [00:00<00:00, 131.91it/s]
 70%|██████▉   | 58/83 [00:00<00:00, 132.74it/s]
100%|██████████| 83/83 [00:00<00:00, 132.13it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 330.27it/s]
  0%|      

[2m[36m(func pid=21400)[0m Epoch 00067: reducing learning rate of group 0 to 4.5357e-07.


 17%|█▋        | 14/83 [00:00<00:00, 139.87it/s]
 34%|███▎      | 28/83 [00:00<00:00, 124.16it/s]
 49%|████▉     | 41/83 [00:00<00:00, 126.63it/s]
 65%|██████▌   | 54/83 [00:00<00:00, 121.64it/s]
 81%|████████  | 67/83 [00:00<00:00, 113.72it/s]
100%|██████████| 83/83 [00:00<00:00, 122.82it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 296.27it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 141.32it/s]
 36%|███▌      | 30/83 [00:00<00:00, 138.98it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 141.41it/s]
100%|██████████| 24/24 [00:00<00:00, 310.72it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 138.22it/s]
 34%|███▎      | 28/83 [00:00<00:00, 85.64it/s] 
 51%|█████     | 42/83 [00:00<00:00, 102.09it/s]
 65%|██████▌   | 54/83 [00:00<00:00, 103.83it/s]
 84%|████████▍ | 70/83 [00:00<00:00, 119.77it/s]
100%|██████████| 83/83 [00:00<00:00, 116.07it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████

[2m[36m(func pid=21400)[0m Epoch 00073: reducing learning rate of group 0 to 2.2679e-07.


  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 137.67it/s]
 34%|███▎      | 28/83 [00:00<00:00, 125.66it/s]
 49%|████▉     | 41/83 [00:00<00:00, 122.19it/s]
 65%|██████▌   | 54/83 [00:00<00:00, 120.71it/s]
 83%|████████▎ | 69/83 [00:00<00:00, 129.15it/s]
100%|██████████| 83/83 [00:00<00:00, 130.95it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 300.90it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 138.65it/s]
 35%|███▍      | 29/83 [00:00<00:00, 141.21it/s]
 53%|█████▎    | 44/83 [00:00<00:00, 103.89it/s]
 72%|███████▏  | 60/83 [00:00<00:00, 119.39it/s]
 92%|█████████▏| 76/83 [00:00<00:00, 131.06it/s]
100%|██████████| 83/83 [00:00<00:00, 128.24it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 305.84it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 14%|█▍        | 12/83 [00:00<00:00, 119.02it/s]
 33%|███▎      | 27/83 [00:00<00:00, 132.61it/s]
 49%|████▉     | 41/8

[2m[36m(func pid=21400)[0m Epoch 00079: reducing learning rate of group 0 to 1.1339e-07.


 29%|██▉       | 24/83 [00:00<00:00, 117.57it/s]
 45%|████▍     | 37/83 [00:00<00:00, 119.57it/s]
 59%|█████▉    | 49/83 [00:00<00:00, 116.48it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 117.30it/s]
 92%|█████████▏| 76/83 [00:00<00:00, 127.75it/s]
100%|██████████| 83/83 [00:00<00:00, 123.35it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 296.00it/s]
 18%|█▊        | 15/83 [00:00<00:00, 145.82it/s]
 36%|███▌      | 30/83 [00:00<00:00, 143.28it/s]
 55%|█████▌    | 46/83 [00:00<00:00, 147.48it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 145.72it/s]
100%|██████████| 24/24 [00:00<00:00, 324.55it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 136.49it/s]
 34%|███▎      | 28/83 [00:00<00:00, 129.30it/s]
 49%|████▉     | 41/83 [00:00<00:00, 124.73it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 124.83it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 115.61it/s]
100%|██████████| 83/83 [00:00<00:00, 125.65it/s]
100%|██████████| 24/24 [00:00<00:00, 335

[2m[36m(func pid=21400)[0m Epoch 00085: reducing learning rate of group 0 to 5.6696e-08.


  7%|▋         | 6/83 [00:00<00:01, 39.22it/s]
 20%|██        | 17/83 [00:00<00:00, 71.21it/s]
 36%|███▌      | 30/83 [00:00<00:00, 93.47it/s]
 49%|████▉     | 41/83 [00:00<00:00, 99.05it/s]
 64%|██████▍   | 53/83 [00:00<00:00, 104.06it/s]
 81%|████████  | 67/83 [00:00<00:00, 113.36it/s]
 96%|█████████▋| 80/83 [00:00<00:00, 115.48it/s]
100%|██████████| 83/83 [00:00<00:00, 102.34it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 276.52it/s]
 17%|█▋        | 14/83 [00:00<00:00, 134.73it/s]
 34%|███▎      | 28/83 [00:00<00:00, 128.64it/s]
 49%|████▉     | 41/83 [00:00<00:00, 122.49it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 127.89it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 126.84it/s]
100%|██████████| 24/24 [00:00<00:00, 253.88it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 27%|██▋       | 22/83 [00:00<00:00, 107.34it/s]
 41%|████      | 34/83 [00:00<00:00, 110.59it/s]
 57%|█████▋    | 47/83 [00:00<00:00, 114.13it/s]
 71%|███████   | 59/83 [00:00<00:00, 107.82it

[2m[36m(func pid=21400)[0m Epoch 00091: reducing learning rate of group 0 to 2.8348e-08.


 29%|██▉       | 24/83 [00:00<00:00, 114.28it/s]
 43%|████▎     | 36/83 [00:00<00:00, 81.28it/s] 
 57%|█████▋    | 47/83 [00:00<00:00, 89.71it/s]
 87%|████████▋ | 72/83 [00:00<00:00, 105.56it/s]
100%|██████████| 83/83 [00:00<00:00, 103.42it/s]
100%|██████████| 24/24 [00:00<00:00, 315.55it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 147.42it/s]
 36%|███▌      | 30/83 [00:00<00:00, 145.33it/s]
 55%|█████▌    | 46/83 [00:00<00:00, 149.78it/s]
 73%|███████▎  | 61/83 [00:00<00:00, 146.86it/s]
 92%|█████████▏| 76/83 [00:00<00:00, 143.17it/s]
100%|██████████| 83/83 [00:00<00:00, 144.18it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 258.54it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 139.71it/s]
 34%|███▎      | 28/83 [00:00<00:00, 131.17it/s]
 51%|█████     | 42/83 [00:00<00:00, 126.29it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 122.61it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 123.70it/s]
10

[2m[36m(func pid=21400)[0m Epoch 00097: reducing learning rate of group 0 to 1.4174e-08.


 18%|█▊        | 15/83 [00:00<00:00, 141.25it/s]
 36%|███▌      | 30/83 [00:00<00:00, 119.27it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 129.30it/s]
 71%|███████   | 59/83 [00:00<00:00, 118.68it/s]
 87%|████████▋ | 72/83 [00:00<00:00, 119.52it/s]
100%|██████████| 83/83 [00:00<00:00, 123.84it/s]
  0%|          | 0/24 [00:00<?, ?it/s]
100%|██████████| 24/24 [00:00<00:00, 300.30it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊        | 15/83 [00:00<00:00, 145.62it/s]
 36%|███▌      | 30/83 [00:00<00:00, 146.49it/s]
 54%|█████▍    | 45/83 [00:00<00:00, 147.56it/s]
100%|██████████| 24/24 [00:00<00:00, 268.87it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 17%|█▋        | 14/83 [00:00<00:00, 132.74it/s]
 51%|█████     | 42/83 [00:00<00:00, 127.97it/s]
 66%|██████▋   | 55/83 [00:00<00:00, 120.54it/s]
 82%|████████▏ | 68/83 [00:00<00:00, 116.92it/s]
100%|██████████| 83/83 [00:00<00:00, 124.34it/s]
100%|██████████| 24/24 [00:00<00:00, 333.18it/s]
  0%|          | 0/83 [00:00<?, ?it/s]
 18%|█▊    

[2m[36m(func pid=11576)[0m Epoch 00013: reducing learning rate of group 0 to 2.3997e-02.


 10%|▉         | 16/166 [00:00<00:00, 156.69it/s]
 19%|█▉        | 32/166 [00:00<00:01, 132.49it/s]
 28%|██▊       | 46/166 [00:00<00:00, 135.04it/s]
 37%|███▋      | 62/166 [00:00<00:00, 141.54it/s]
 48%|████▊     | 79/166 [00:00<00:00, 148.31it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 148.17it/s]
 66%|██████▋   | 110/166 [00:00<00:00, 142.87it/s]
 77%|███████▋  | 127/166 [00:00<00:00, 149.10it/s]
 87%|████████▋ | 145/166 [00:00<00:00, 158.00it/s]
100%|██████████| 166/166 [00:01<00:00, 151.47it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 462.74it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 142.95it/s]
 19%|█▉        | 32/166 [00:00<00:00, 154.73it/s]
 30%|███       | 50/166 [00:00<00:00, 161.21it/s]
 41%|████      | 68/166 [00:00<00:00, 167.10it/s]
 52%|█████▏    | 86/166 [00:00<00:00, 169.68it/s]
 63%|██████▎   | 105/166 [00:00<00:00, 174.13it/s]
 74%|███████▍  | 123/166 [00:00<00:00, 160.70it/s]
 84%|████████▍ |

[2m[36m(func pid=11576)[0m Epoch 00019: reducing learning rate of group 0 to 1.1999e-02.


  0%|          | 0/166 [00:00<?, ?it/s]
 10%|█         | 17/166 [00:00<00:00, 162.74it/s]
 30%|███       | 50/166 [00:00<00:00, 148.27it/s]
 39%|███▉      | 65/166 [00:00<00:00, 140.04it/s]
 48%|████▊     | 80/166 [00:00<00:00, 128.70it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 134.45it/s]
 68%|██████▊   | 113/166 [00:00<00:00, 146.32it/s]
 79%|███████▉  | 131/166 [00:00<00:00, 154.85it/s]
100%|██████████| 166/166 [00:01<00:00, 152.11it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 520.72it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 158.15it/s]
 19%|█▉        | 32/166 [00:00<00:00, 153.89it/s]
 29%|██▉       | 48/166 [00:00<00:00, 149.16it/s]
 48%|████▊     | 79/166 [00:00<00:00, 149.00it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 150.09it/s]
 67%|██████▋   | 112/166 [00:00<00:00, 154.45it/s]
 77%|███████▋  | 128/166 [00:00<00:00, 141.42it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 3

[2m[36m(func pid=11576)[0m Epoch 00025: reducing learning rate of group 0 to 5.9993e-03.


  8%|▊         | 13/166 [00:00<00:01, 124.99it/s]
 17%|█▋        | 28/166 [00:00<00:00, 138.93it/s]
 25%|██▌       | 42/166 [00:00<00:00, 136.60it/s]
 34%|███▍      | 57/166 [00:00<00:00, 140.35it/s]
 52%|█████▏    | 86/166 [00:00<00:00, 127.86it/s]
 61%|██████    | 101/166 [00:00<00:00, 133.66it/s]
 71%|███████   | 118/166 [00:00<00:00, 142.88it/s]
 82%|████████▏ | 136/166 [00:00<00:00, 152.87it/s]
100%|██████████| 166/166 [00:01<00:00, 146.02it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 508.44it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 11%|█         | 18/166 [00:00<00:00, 174.40it/s]
 22%|██▏       | 36/166 [00:00<00:00, 156.81it/s]
 31%|███▏      | 52/166 [00:00<00:00, 154.87it/s]
 41%|████      | 68/166 [00:00<00:00, 153.38it/s]
 51%|█████     | 85/166 [00:00<00:00, 158.04it/s]
 62%|██████▏   | 103/166 [00:00<00:00, 163.48it/s]
 72%|███████▏  | 120/166 [00:00<00:00, 156.69it/s]
 82%|████████▏ | 136/166 [00:00<00:00, 151.75it/s]
  0%|          

[2m[36m(func pid=11576)[0m Epoch 00031: reducing learning rate of group 0 to 2.9997e-03.


 15%|█▌        | 25/166 [00:00<00:01, 123.77it/s]
 23%|██▎       | 38/166 [00:00<00:01, 115.42it/s]
 31%|███▏      | 52/166 [00:00<00:00, 121.79it/s]
 39%|███▉      | 65/166 [00:00<00:00, 113.11it/s]
 46%|████▋     | 77/166 [00:00<00:00, 115.23it/s]
 55%|█████▍    | 91/166 [00:00<00:00, 122.41it/s]
 72%|███████▏  | 120/166 [00:00<00:00, 131.24it/s]
 81%|████████▏ | 135/166 [00:01<00:00, 136.37it/s]
 90%|█████████ | 150/166 [00:01<00:00, 140.06it/s]
100%|██████████| 166/166 [00:01<00:00, 130.62it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 521.59it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 18%|█▊        | 30/166 [00:00<00:00, 141.96it/s]
 27%|██▋       | 45/166 [00:00<00:00, 141.02it/s]
 38%|███▊      | 63/166 [00:00<00:00, 153.06it/s]
 48%|████▊     | 80/166 [00:00<00:00, 156.09it/s]
 58%|█████▊    | 96/166 [00:00<00:00, 156.85it/s]
 68%|██████▊   | 113/166 [00:00<00:00, 159.13it/s]
 79%|███████▉  | 131/166 [00:00<00:00, 163.97it/s]
 90%|█████████ |

[2m[36m(func pid=11576)[0m Epoch 00037: reducing learning rate of group 0 to 1.4998e-03.


  7%|▋         | 11/166 [00:00<00:01, 102.63it/s]
 13%|█▎        | 22/166 [00:00<00:01, 99.46it/s] 
 20%|█▉        | 33/166 [00:00<00:01, 101.40it/s]
 27%|██▋       | 44/166 [00:00<00:01, 102.40it/s]
 33%|███▎      | 55/166 [00:00<00:01, 103.79it/s]
 40%|████      | 67/166 [00:00<00:00, 108.41it/s]
 47%|████▋     | 78/166 [00:00<00:00, 108.61it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 117.34it/s]
 65%|██████▌   | 108/166 [00:00<00:00, 128.09it/s]
 74%|███████▍  | 123/166 [00:01<00:00, 133.77it/s]
 84%|████████▍ | 140/166 [00:01<00:00, 142.55it/s]
 93%|█████████▎| 155/166 [00:01<00:00, 141.77it/s]
100%|██████████| 166/166 [00:01<00:00, 123.97it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 406.58it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 143.86it/s]
 18%|█▊        | 30/166 [00:00<00:00, 140.76it/s]
 27%|██▋       | 45/166 [00:00<00:01, 95.94it/s] 
 36%|███▌      | 60/166 [00:00<00:00, 111.81it/s]
 45%|████▌     | 

[2m[36m(func pid=11576)[0m Epoch 00043: reducing learning rate of group 0 to 7.4992e-04.


  9%|▉         | 15/166 [00:00<00:01, 149.86it/s]
 18%|█▊        | 30/166 [00:00<00:01, 127.90it/s]
 26%|██▌       | 43/166 [00:00<00:01, 117.95it/s]
 34%|███▎      | 56/166 [00:00<00:00, 121.14it/s]
 42%|████▏     | 69/166 [00:00<00:00, 113.07it/s]
 49%|████▉     | 81/166 [00:00<00:00, 94.58it/s] 
 69%|██████▊   | 114/166 [00:00<00:00, 126.64it/s]
 79%|███████▉  | 131/166 [00:01<00:00, 137.05it/s]
 89%|████████▉ | 148/166 [00:01<00:00, 144.72it/s]
100%|██████████| 166/166 [00:01<00:00, 129.86it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 484.72it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 152.56it/s]
 19%|█▉        | 32/166 [00:00<00:00, 146.76it/s]
 30%|██▉       | 49/166 [00:00<00:00, 152.78it/s]
 49%|████▉     | 82/166 [00:00<00:00, 153.62it/s]
 60%|██████    | 100/166 [00:00<00:00, 159.08it/s]
 71%|███████   | 118/166 [00:00<00:00, 162.89it/s]
 81%|████████▏ | 135/166 [00:00<00:00, 164.76it/s]
100%|██████████

[2m[36m(func pid=11576)[0m Epoch 00049: reducing learning rate of group 0 to 3.7496e-04.


 16%|█▌        | 26/166 [00:00<00:01, 129.17it/s]
 25%|██▍       | 41/166 [00:00<00:00, 138.08it/s]
 33%|███▎      | 55/166 [00:00<00:00, 128.28it/s]
 43%|████▎     | 71/166 [00:00<00:00, 136.28it/s]
 54%|█████▎    | 89/166 [00:00<00:00, 149.96it/s]
 64%|██████▍   | 106/166 [00:00<00:00, 155.74it/s]
 73%|███████▎  | 122/166 [00:00<00:00, 149.12it/s]
 84%|████████▍ | 140/166 [00:00<00:00, 156.31it/s]
 95%|█████████▌| 158/166 [00:01<00:00, 162.69it/s]
100%|██████████| 166/166 [00:01<00:00, 150.10it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 473.91it/s]
 11%|█         | 18/166 [00:00<00:00, 171.64it/s]
 22%|██▏       | 36/166 [00:00<00:00, 173.58it/s]
 33%|███▎      | 54/166 [00:00<00:00, 166.46it/s]
 43%|████▎     | 71/166 [00:00<00:00, 162.36it/s]
 53%|█████▎    | 88/166 [00:00<00:00, 162.59it/s]
 63%|██████▎   | 105/166 [00:00<00:00, 163.95it/s]
 73%|███████▎  | 122/166 [00:00<00:00, 162.83it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
 88%|████████▊ |

[2m[36m(func pid=11576)[0m Epoch 00055: reducing learning rate of group 0 to 1.8748e-04.


  8%|▊         | 14/166 [00:00<00:01, 135.46it/s]
 17%|█▋        | 29/166 [00:00<00:00, 140.52it/s]
 27%|██▋       | 44/166 [00:00<00:00, 131.23it/s]
 36%|███▌      | 59/166 [00:00<00:00, 135.32it/s]
 45%|████▌     | 75/166 [00:00<00:00, 141.60it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 148.49it/s]
 66%|██████▌   | 109/166 [00:00<00:00, 153.22it/s]
 76%|███████▌  | 126/166 [00:00<00:00, 157.14it/s]
 86%|████████▌ | 142/166 [00:00<00:00, 154.50it/s]
 96%|█████████▌| 159/166 [00:01<00:00, 157.38it/s]
100%|██████████| 166/166 [00:01<00:00, 150.18it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 486.29it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 142.65it/s]
 18%|█▊        | 30/166 [00:00<00:00, 145.68it/s]
 29%|██▉       | 48/166 [00:00<00:00, 157.90it/s]
 39%|███▉      | 65/166 [00:00<00:00, 161.83it/s]
 49%|████▉     | 82/166 [00:00<00:00, 164.23it/s]
 60%|█████▉    | 99/166 [00:00<00:00, 165.03it/s]
 70%|███████   | 

[2m[36m(func pid=11576)[0m Epoch 00061: reducing learning rate of group 0 to 9.3740e-05.


 20%|█▉        | 33/166 [00:00<00:00, 159.37it/s]
 30%|██▉       | 49/166 [00:00<00:00, 151.42it/s]
 39%|███▉      | 65/166 [00:00<00:00, 149.53it/s]
 60%|█████▉    | 99/166 [00:00<00:00, 154.22it/s]
 69%|██████▉   | 115/166 [00:00<00:00, 148.73it/s]
 80%|████████  | 133/166 [00:00<00:00, 156.14it/s]
 90%|█████████ | 150/166 [00:00<00:00, 158.89it/s]
100%|██████████| 166/166 [00:01<00:00, 156.77it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 516.37it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 14/166 [00:00<00:01, 136.60it/s]
 19%|█▉        | 32/166 [00:00<00:00, 160.36it/s]
 30%|██▉       | 49/166 [00:00<00:00, 163.22it/s]
 40%|████      | 67/166 [00:00<00:00, 168.39it/s]
 51%|█████     | 84/166 [00:00<00:00, 167.27it/s]
 61%|██████    | 101/166 [00:00<00:00, 155.65it/s]
 70%|███████   | 117/166 [00:00<00:00, 134.80it/s]
 79%|███████▉  | 131/166 [00:00<00:00, 125.22it/s]
 89%|████████▊ | 147/166 [00:01<00:00, 132.52it/s]
  0%|         

[2m[36m(func pid=11576)[0m Epoch 00067: reducing learning rate of group 0 to 4.6870e-05.


  8%|▊         | 14/166 [00:00<00:01, 130.98it/s]
 17%|█▋        | 28/166 [00:00<00:01, 122.82it/s]
 33%|███▎      | 54/166 [00:00<00:00, 118.55it/s]
 40%|███▉      | 66/166 [00:00<00:00, 111.55it/s]
 49%|████▉     | 81/166 [00:00<00:00, 122.21it/s]
 60%|██████    | 100/166 [00:00<00:00, 141.03it/s]
 72%|███████▏  | 119/166 [00:00<00:00, 154.56it/s]
 83%|████████▎ | 138/166 [00:00<00:00, 162.69it/s]
100%|██████████| 166/166 [00:01<00:00, 145.02it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 409.92it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|█         | 17/166 [00:00<00:00, 163.41it/s]
 20%|██        | 34/166 [00:00<00:00, 157.38it/s]
 30%|███       | 50/166 [00:00<00:00, 154.31it/s]
 40%|███▉      | 66/166 [00:00<00:00, 154.15it/s]
 51%|█████     | 84/166 [00:00<00:00, 160.24it/s]
 61%|██████▏   | 102/166 [00:00<00:00, 164.14it/s]
 72%|███████▏  | 120/166 [00:00<00:00, 167.56it/s]
 83%|████████▎ | 137/166 [00:00<00:00, 167.13it/s]
  0%|          

[2m[36m(func pid=11576)[0m Epoch 00073: reducing learning rate of group 0 to 2.3435e-05.


 15%|█▌        | 25/166 [00:00<00:01, 121.37it/s]
 23%|██▎       | 38/166 [00:00<00:01, 110.69it/s]
 30%|███       | 50/166 [00:00<00:01, 111.98it/s]
 39%|███▉      | 65/166 [00:00<00:00, 122.24it/s]
 49%|████▉     | 81/166 [00:00<00:00, 132.50it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 139.92it/s]
 68%|██████▊   | 113/166 [00:00<00:00, 144.64it/s]
 77%|███████▋  | 128/166 [00:00<00:00, 145.29it/s]
 87%|████████▋ | 144/166 [00:01<00:00, 148.34it/s]
100%|██████████| 166/166 [00:01<00:00, 137.74it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 490.17it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|█         | 17/166 [00:00<00:00, 169.80it/s]
 22%|██▏       | 36/166 [00:00<00:00, 175.97it/s]
 33%|███▎      | 54/166 [00:00<00:00, 176.27it/s]
 43%|████▎     | 72/166 [00:00<00:00, 136.39it/s]
 54%|█████▍    | 90/166 [00:00<00:00, 147.30it/s]
 64%|██████▍   | 106/166 [00:00<00:00, 140.44it/s]
 82%|████████▏ | 136/166 [00:00<00:00, 142.58it/s]
 92%|█████████▏|

[2m[36m(func pid=11576)[0m Epoch 00079: reducing learning rate of group 0 to 1.1717e-05.


 16%|█▌        | 26/166 [00:00<00:01, 128.60it/s]
 23%|██▎       | 39/166 [00:00<00:01, 122.72it/s]
 33%|███▎      | 54/166 [00:00<00:00, 131.60it/s]
 41%|████      | 68/166 [00:00<00:00, 120.55it/s]
 49%|████▉     | 81/166 [00:00<00:00, 119.77it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 106.21it/s]
 67%|██████▋   | 112/166 [00:00<00:00, 117.32it/s]
 78%|███████▊  | 130/166 [00:01<00:00, 132.85it/s]
 89%|████████▉ | 148/166 [00:01<00:00, 144.39it/s]
 99%|█████████▉| 165/166 [00:01<00:00, 151.19it/s]
100%|██████████| 166/166 [00:01<00:00, 131.66it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 497.74it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 144.48it/s]
 18%|█▊        | 30/166 [00:00<00:00, 146.68it/s]
 27%|██▋       | 45/166 [00:00<00:00, 142.51it/s]
 36%|███▌      | 60/166 [00:00<00:00, 143.25it/s]
 46%|████▌     | 76/166 [00:00<00:00, 147.01it/s]
 56%|█████▌    | 93/166 [00:00<00:00, 154.02it/s]
 66%|██████▌   | 

[2m[36m(func pid=11576)[0m Epoch 00085: reducing learning rate of group 0 to 5.8587e-06.


  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 14/166 [00:00<00:01, 139.66it/s]
 17%|█▋        | 28/166 [00:00<00:01, 126.84it/s]
 25%|██▍       | 41/166 [00:00<00:00, 127.39it/s]
 33%|███▎      | 54/166 [00:00<00:00, 125.29it/s]
 40%|████      | 67/166 [00:00<00:00, 122.47it/s]
 49%|████▉     | 82/166 [00:00<00:00, 129.34it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 135.54it/s]
 77%|███████▋  | 128/166 [00:00<00:00, 145.66it/s]
 86%|████████▌ | 143/166 [00:01<00:00, 144.61it/s]
100%|██████████| 166/166 [00:01<00:00, 138.92it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 475.20it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 145.71it/s]
 18%|█▊        | 30/166 [00:00<00:00, 145.33it/s]
 28%|██▊       | 46/166 [00:00<00:00, 151.53it/s]
 38%|███▊      | 63/166 [00:00<00:00, 158.71it/s]
 59%|█████▉    | 98/166 [00:00<00:00, 165.79it/s]
 70%|██████▉   | 116/166 [00:00<00:00, 167.25it/s]
 80%|████████  | 133/166 [00

[2m[36m(func pid=11576)[0m Epoch 00091: reducing learning rate of group 0 to 2.9294e-06.


  8%|▊         | 14/166 [00:00<00:01, 139.54it/s]
 17%|█▋        | 28/166 [00:00<00:01, 126.05it/s]
 25%|██▍       | 41/166 [00:00<00:01, 122.83it/s]
 33%|███▎      | 54/166 [00:00<00:00, 121.84it/s]
 40%|████      | 67/166 [00:00<00:00, 117.45it/s]
 49%|████▉     | 82/166 [00:00<00:00, 126.67it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 132.93it/s]
 68%|██████▊   | 113/166 [00:00<00:00, 141.11it/s]
 78%|███████▊  | 130/166 [00:00<00:00, 148.92it/s]
 89%|████████▉ | 148/166 [00:01<00:00, 156.34it/s]
100%|██████████| 166/166 [00:01<00:00, 140.16it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 505.65it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|█         | 17/166 [00:00<00:00, 169.83it/s]
 20%|██        | 34/166 [00:00<00:00, 155.52it/s]
 30%|███       | 50/166 [00:00<00:00, 152.68it/s]
 40%|███▉      | 66/166 [00:00<00:00, 152.04it/s]
 50%|█████     | 83/166 [00:00<00:00, 155.07it/s]
 60%|██████    | 100/166 [00:00<00:00, 159.38it/s]
 70%|███████   | 

[2m[36m(func pid=11576)[0m Epoch 00097: reducing learning rate of group 0 to 1.4647e-06.


  0%|          | 0/166 [00:00<?, ?it/s]
 15%|█▌        | 25/166 [00:00<00:01, 123.23it/s]
 23%|██▎       | 38/166 [00:00<00:01, 123.43it/s]
 32%|███▏      | 53/166 [00:00<00:00, 131.74it/s]
 40%|████      | 67/166 [00:00<00:00, 124.08it/s]
 49%|████▉     | 81/166 [00:00<00:00, 128.52it/s]
 69%|██████▉   | 115/166 [00:00<00:00, 145.51it/s]
 79%|███████▉  | 131/166 [00:00<00:00, 149.41it/s]
 89%|████████▊ | 147/166 [00:01<00:00, 152.52it/s]
100%|██████████| 166/166 [00:01<00:00, 140.07it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 409.90it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 158.88it/s]
 19%|█▉        | 32/166 [00:00<00:00, 157.92it/s]
 30%|██▉       | 49/166 [00:00<00:00, 160.71it/s]
 40%|███▉      | 66/166 [00:00<00:00, 159.75it/s]
 49%|████▉     | 82/166 [00:00<00:00, 158.62it/s]
 60%|█████▉    | 99/166 [00:00<00:00, 158.25it/s]
 69%|██████▉   | 115/166 [00:00<00:00, 156.86it/s]
 79%|███████▉  | 131/166 [0

[2m[36m(func pid=11576)[0m Epoch 00103: reducing learning rate of group 0 to 7.3234e-07.


  8%|▊         | 13/166 [00:00<00:01, 123.22it/s]
 16%|█▌        | 26/166 [00:00<00:01, 112.12it/s]
 23%|██▎       | 38/166 [00:00<00:01, 113.61it/s]
 33%|███▎      | 54/166 [00:00<00:00, 126.95it/s]
 40%|████      | 67/166 [00:00<00:00, 123.82it/s]
 49%|████▉     | 82/166 [00:00<00:00, 130.03it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 135.96it/s]
 67%|██████▋   | 111/166 [00:00<00:00, 132.57it/s]
 75%|███████▌  | 125/166 [00:00<00:00, 131.75it/s]
 85%|████████▍ | 141/166 [00:01<00:00, 138.01it/s]
100%|██████████| 166/166 [00:01<00:00, 133.47it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 485.78it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 156.85it/s]
 19%|█▉        | 32/166 [00:00<00:00, 154.76it/s]
 30%|██▉       | 49/166 [00:00<00:00, 156.75it/s]
 39%|███▉      | 65/166 [00:00<00:00, 152.54it/s]
 49%|████▉     | 81/166 [00:00<00:00, 146.53it/s]
 58%|█████▊    | 96/166 [00:00<00:00, 139.17it/s]
 67%|██████▋   | 1

[2m[36m(func pid=11576)[0m Epoch 00109: reducing learning rate of group 0 to 3.6617e-07.


  7%|▋         | 12/166 [00:00<00:01, 119.80it/s]
 16%|█▌        | 26/166 [00:00<00:01, 127.15it/s]
 23%|██▎       | 39/166 [00:00<00:01, 125.66it/s]
 33%|███▎      | 54/166 [00:00<00:00, 131.54it/s]
 41%|████      | 68/166 [00:00<00:00, 133.12it/s]
 51%|█████     | 84/166 [00:00<00:00, 141.99it/s]
 61%|██████    | 101/166 [00:00<00:00, 147.36it/s]
 70%|██████▉   | 116/166 [00:00<00:00, 147.65it/s]
 80%|████████  | 133/166 [00:00<00:00, 150.92it/s]
 90%|█████████ | 150/166 [00:01<00:00, 154.54it/s]
100%|██████████| 166/166 [00:01<00:00, 145.09it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 464.78it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 14/166 [00:00<00:01, 139.38it/s]
 27%|██▋       | 45/166 [00:00<00:00, 146.86it/s]
 36%|███▌      | 60/166 [00:00<00:00, 146.77it/s]
 45%|████▌     | 75/166 [00:00<00:00, 112.34it/s]
 53%|█████▎    | 88/166 [00:00<00:00, 109.64it/s]
 67%|██████▋   | 112/166 [00:00<00:00, 114.48it/s]
 75%|███████▍  |

[2m[36m(func pid=11576)[0m Epoch 00115: reducing learning rate of group 0 to 1.8309e-07.


 20%|██        | 34/166 [00:00<00:00, 156.40it/s]
 30%|███       | 50/166 [00:00<00:00, 154.05it/s]
 40%|███▉      | 66/166 [00:00<00:00, 151.18it/s]
 49%|████▉     | 82/166 [00:00<00:00, 151.85it/s]
 59%|█████▉    | 98/166 [00:00<00:00, 152.79it/s]
 69%|██████▊   | 114/166 [00:00<00:00, 122.52it/s]
 79%|███████▉  | 131/166 [00:00<00:00, 132.96it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 349.90it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 13/166 [00:00<00:01, 124.57it/s]
 16%|█▌        | 26/166 [00:00<00:01, 120.23it/s]
 23%|██▎       | 39/166 [00:00<00:01, 123.08it/s]
 32%|███▏      | 53/166 [00:00<00:00, 129.43it/s]
 48%|████▊     | 80/166 [00:00<00:00, 120.49it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 128.18it/s]
 67%|██████▋   | 111/166 [00:00<00:00, 137.29it/s]
 76%|███████▌  | 126/166 [00:00<00:00, 139.64it/s]
 86%|████████▌ | 142/166 [00:01<00:00, 143.39it/s]
100%|██████████| 166/166 [00:01<00:00, 134.13it/s]
  0%|          |

[2m[36m(func pid=11576)[0m Epoch 00121: reducing learning rate of group 0 to 9.1543e-08.


 18%|█▊        | 30/166 [00:00<00:00, 146.72it/s]
 27%|██▋       | 45/166 [00:00<00:00, 140.45it/s]
 37%|███▋      | 61/166 [00:00<00:00, 146.59it/s]
 46%|████▋     | 77/166 [00:00<00:00, 148.80it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 148.30it/s]
 65%|██████▌   | 108/166 [00:00<00:00, 151.94it/s]
 75%|███████▍  | 124/166 [00:00<00:00, 150.63it/s]
 84%|████████▍ | 140/166 [00:00<00:00, 149.72it/s]
 94%|█████████▍| 156/166 [00:01<00:00, 150.68it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
 81%|████████▏ | 39/48 [00:00<00:00, 379.16it/s]
100%|██████████| 48/48 [00:00<00:00, 372.24it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  9%|▉         | 15/166 [00:00<00:01, 149.73it/s]
 18%|█▊        | 30/166 [00:00<00:00, 139.31it/s]
 27%|██▋       | 44/166 [00:00<00:00, 136.66it/s]
 36%|███▌      | 59/166 [00:00<00:00, 140.06it/s]
 45%|████▍     | 74/166 [00:00<00:00, 128.74it/s]
 54%|█████▎    | 89/166 [00:00<00:00, 133.64it/s]
 63%|██████▎   | 105/166 [00:00<00:00, 141.27it/s]
 73%|███████▎  | 1

[2m[36m(func pid=11576)[0m Epoch 00127: reducing learning rate of group 0 to 4.5771e-08.


 20%|██        | 34/166 [00:00<00:00, 161.36it/s]
 31%|███       | 51/166 [00:00<00:00, 161.92it/s]
 41%|████      | 68/166 [00:00<00:00, 153.74it/s]
 51%|█████     | 84/166 [00:00<00:00, 153.67it/s]
 60%|██████    | 100/166 [00:00<00:00, 154.71it/s]
 70%|██████▉   | 116/166 [00:00<00:00, 153.08it/s]
 80%|███████▉  | 132/166 [00:00<00:00, 149.88it/s]
 89%|████████▉ | 148/166 [00:00<00:00, 151.56it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
 77%|███████▋  | 37/48 [00:00<00:00, 364.90it/s]
100%|██████████| 48/48 [00:00<00:00, 342.25it/s]
  8%|▊         | 14/166 [00:00<00:01, 138.43it/s]
 17%|█▋        | 28/166 [00:00<00:01, 131.78it/s]
 25%|██▌       | 42/166 [00:00<00:00, 133.49it/s]
 34%|███▎      | 56/166 [00:00<00:00, 133.02it/s]
 44%|████▍     | 73/166 [00:00<00:00, 145.02it/s]
 54%|█████▍    | 90/166 [00:00<00:00, 150.19it/s]
 64%|██████▍   | 106/166 [00:00<00:00, 152.36it/s]
 74%|███████▍  | 123/166 [00:00<00:00, 155.94it/s]
 85%|████████▍ | 141/166 [00:00<00:00, 161.16it/s]
 95%|█

[2m[36m(func pid=11576)[0m Epoch 00133: reducing learning rate of group 0 to 2.2886e-08.


 21%|██        | 35/166 [00:00<00:00, 169.72it/s]
 31%|███▏      | 52/166 [00:00<00:00, 166.58it/s]
 42%|████▏     | 69/166 [00:00<00:00, 163.12it/s]
 52%|█████▏    | 86/166 [00:00<00:00, 160.36it/s]
 62%|██████▏   | 103/166 [00:00<00:00, 159.95it/s]
 72%|███████▏  | 120/166 [00:00<00:00, 155.71it/s]
 82%|████████▏ | 136/166 [00:00<00:00, 153.79it/s]
 93%|█████████▎| 154/166 [00:00<00:00, 158.81it/s]
100%|██████████| 48/48 [00:00<00:00, 456.84it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 152.19it/s]
 19%|█▉        | 32/166 [00:00<00:00, 144.13it/s]
 28%|██▊       | 47/166 [00:00<00:00, 141.26it/s]
 37%|███▋      | 62/166 [00:00<00:00, 131.84it/s]
 46%|████▌     | 76/166 [00:00<00:00, 126.99it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 137.07it/s]
 65%|██████▌   | 108/166 [00:00<00:00, 144.00it/s]
 75%|███████▌  | 125/166 [00:00<00:00, 151.50it/s]
 86%|████████▌ | 143/166 [00:00<00:00, 157.13it/s]
100%|██████████| 166/166 [00:01<00:00, 148.22it/s]
100

[2m[36m(func pid=11576)[0m Epoch 00139: reducing learning rate of group 0 to 1.1443e-08.


 19%|█▉        | 32/166 [00:00<00:00, 136.19it/s]
 28%|██▊       | 46/166 [00:00<00:00, 121.89it/s]
 36%|███▌      | 59/166 [00:00<00:00, 117.37it/s]
 46%|████▌     | 76/166 [00:00<00:00, 133.98it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 142.06it/s]
 66%|██████▌   | 109/166 [00:00<00:00, 149.68it/s]
 75%|███████▌  | 125/166 [00:00<00:00, 151.55it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 420.57it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
 10%|▉         | 16/166 [00:00<00:00, 150.54it/s]
 19%|█▉        | 32/166 [00:00<00:00, 148.22it/s]
 28%|██▊       | 47/166 [00:00<00:00, 147.42it/s]
 37%|███▋      | 62/166 [00:00<00:00, 142.20it/s]
 47%|████▋     | 78/166 [00:00<00:00, 147.41it/s]
 58%|█████▊    | 97/166 [00:00<00:00, 159.13it/s]
 70%|██████▉   | 116/166 [00:00<00:00, 166.31it/s]
 80%|████████  | 133/166 [00:00<00:00, 166.78it/s]
 91%|█████████ | 151/166 [00:00<00:00, 168.58it/s]
100%|██████████| 166/166 [00:01<00:00, 161.68it/s]
  0%|          |

[2m[36m(func pid=14656)[0m Epoch 00056: reducing learning rate of group 0 to 2.5825e-03.


  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 12/166 [00:00<00:01, 114.16it/s]
 14%|█▍        | 24/166 [00:00<00:01, 101.89it/s]
 21%|██        | 35/166 [00:00<00:01, 102.57it/s]
 28%|██▊       | 46/166 [00:00<00:01, 97.84it/s] 
 34%|███▎      | 56/166 [00:00<00:01, 97.28it/s]
 40%|███▉      | 66/166 [00:00<00:01, 94.96it/s]
 48%|████▊     | 79/166 [00:00<00:00, 104.84it/s]
 55%|█████▌    | 92/166 [00:00<00:00, 111.41it/s]
 64%|██████▍   | 106/166 [00:00<00:00, 117.52it/s]
 72%|███████▏  | 119/166 [00:01<00:00, 120.40it/s]
 80%|███████▉  | 132/166 [00:01<00:00, 120.74it/s]
 87%|████████▋ | 145/166 [00:01<00:00, 122.07it/s]
 95%|█████████▌| 158/166 [00:01<00:00, 120.55it/s]
100%|██████████| 166/166 [00:01<00:00, 112.44it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 416.50it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 13/166 [00:00<00:01, 122.64it/s]
 16%|█▌        | 26/166 [00:00<00:01, 122.46it/s]
 24%|██▍       | 40/166 [00:

[2m[36m(func pid=14656)[0m Epoch 00072: reducing learning rate of group 0 to 1.2913e-03.


  7%|▋         | 12/166 [00:00<00:01, 114.09it/s]
 15%|█▌        | 25/166 [00:00<00:01, 118.65it/s]
 22%|██▏       | 37/166 [00:00<00:01, 113.63it/s]
 30%|██▉       | 49/166 [00:00<00:01, 111.41it/s]
 37%|███▋      | 61/166 [00:00<00:00, 113.55it/s]
 52%|█████▏    | 86/166 [00:00<00:00, 117.96it/s]
 59%|█████▉    | 98/166 [00:00<00:00, 117.10it/s]
 67%|██████▋   | 111/166 [00:00<00:00, 117.84it/s]
 75%|███████▍  | 124/166 [00:01<00:00, 119.21it/s]
 82%|████████▏ | 136/166 [00:01<00:00, 118.17it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
 71%|███████   | 34/48 [00:00<00:00, 330.55it/s]
100%|██████████| 48/48 [00:00<00:00, 311.87it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  6%|▌         | 10/166 [00:00<00:01, 96.08it/s]
 12%|█▏        | 20/166 [00:00<00:01, 89.53it/s]
 18%|█▊        | 30/166 [00:00<00:01, 92.89it/s]
 25%|██▍       | 41/166 [00:00<00:01, 97.55it/s]
 31%|███       | 51/166 [00:00<00:01, 89.67it/s]
 45%|████▌     | 75/166 [00:00<00:00, 104.72it/s]
 52%|█████▏    | 87/166 [

[2m[36m(func pid=14656)[0m Epoch 00080: reducing learning rate of group 0 to 6.4563e-04.


 13%|█▎        | 21/166 [00:00<00:01, 96.14it/s]
 19%|█▊        | 31/166 [00:00<00:01, 94.14it/s]
 26%|██▌       | 43/166 [00:00<00:01, 100.81it/s]
 39%|███▉      | 65/166 [00:00<00:01, 98.42it/s] 
 47%|████▋     | 78/166 [00:00<00:00, 105.72it/s]
 55%|█████▍    | 91/166 [00:00<00:00, 110.25it/s]
 62%|██████▏   | 103/166 [00:00<00:00, 109.94it/s]
 69%|██████▉   | 115/166 [00:01<00:00, 112.22it/s]
 77%|███████▋  | 128/166 [00:01<00:00, 115.38it/s]
 84%|████████▍ | 140/166 [00:01<00:00, 116.09it/s]
 92%|█████████▏| 153/166 [00:01<00:00, 118.43it/s]
100%|██████████| 166/166 [00:01<00:00, 109.53it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 417.77it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 107.60it/s]
 13%|█▎        | 22/166 [00:00<00:01, 104.40it/s]
 20%|██        | 34/166 [00:00<00:01, 111.08it/s]
 28%|██▊       | 46/166 [00:00<00:01, 114.41it/s]
 43%|████▎     | 72/166 [00:00<00:00, 122.09it/s]
 51%|█████     | 8

[2m[36m(func pid=14656)[0m Epoch 00090: reducing learning rate of group 0 to 3.2282e-04.


  0%|          | 0/166 [00:00<?, ?it/s]
  8%|▊         | 13/166 [00:00<00:01, 125.08it/s]
 16%|█▌        | 26/166 [00:00<00:01, 121.35it/s]
 23%|██▎       | 39/166 [00:00<00:01, 110.25it/s]
 31%|███       | 51/166 [00:00<00:01, 106.17it/s]
 39%|███▊      | 64/166 [00:00<00:00, 110.96it/s]
 46%|████▌     | 76/166 [00:00<00:00, 105.26it/s]
 52%|█████▏    | 87/166 [00:00<00:00, 100.00it/s]
 60%|█████▉    | 99/166 [00:00<00:00, 103.29it/s]
 66%|██████▋   | 110/166 [00:01<00:00, 103.36it/s]
 73%|███████▎  | 122/166 [00:01<00:00, 106.05it/s]
 81%|████████  | 134/166 [00:01<00:00, 108.44it/s]
 87%|████████▋ | 145/166 [00:01<00:00, 108.31it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 393.54it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 99.97it/s]
 13%|█▎        | 21/166 [00:00<00:01, 97.20it/s]
 19%|█▉        | 32/166 [00:00<00:01, 101.06it/s]
 26%|██▌       | 43/166 [00:00<00:01, 95.02it/s] 
 33%|███▎      | 54/166 [00:00

[2m[36m(func pid=14656)[0m Epoch 00098: reducing learning rate of group 0 to 1.6141e-04.


  5%|▍         | 8/166 [00:00<00:01, 79.89it/s]
 18%|█▊        | 30/166 [00:00<00:01, 97.23it/s]
 24%|██▍       | 40/166 [00:00<00:01, 94.29it/s]
 30%|███       | 50/166 [00:00<00:01, 91.91it/s]
 37%|███▋      | 61/166 [00:00<00:01, 94.91it/s]
 43%|████▎     | 71/166 [00:00<00:01, 89.80it/s]
 50%|█████     | 83/166 [00:00<00:00, 96.22it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 101.73it/s]
 65%|██████▌   | 108/166 [00:01<00:00, 107.36it/s]
 72%|███████▏  | 120/166 [00:01<00:00, 109.22it/s]
 80%|███████▉  | 132/166 [00:01<00:00, 110.65it/s]
 87%|████████▋ | 144/166 [00:01<00:00, 112.01it/s]
100%|██████████| 166/166 [00:01<00:00, 104.52it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 353.37it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 105.66it/s]
 13%|█▎        | 22/166 [00:00<00:01, 101.63it/s]
 20%|█▉        | 33/166 [00:00<00:01, 99.28it/s] 
 26%|██▌       | 43/166 [00:00<00:01, 94.16it/s]
 32%|███▏      | 53/166 [0

[2m[36m(func pid=14656)[0m Epoch 00115: reducing learning rate of group 0 to 8.0704e-05.


  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 109.10it/s]
 13%|█▎        | 22/166 [00:00<00:01, 105.93it/s]
 20%|█▉        | 33/166 [00:00<00:01, 105.17it/s]
 27%|██▋       | 45/166 [00:00<00:01, 109.54it/s]
 34%|███▎      | 56/166 [00:00<00:01, 103.24it/s]
 40%|████      | 67/166 [00:00<00:00, 101.53it/s]
 48%|████▊     | 79/166 [00:00<00:00, 105.67it/s]
 55%|█████▍    | 91/166 [00:00<00:00, 108.96it/s]
 62%|██████▏   | 103/166 [00:00<00:00, 110.05it/s]
 69%|██████▉   | 115/166 [00:01<00:00, 89.64it/s] 
 77%|███████▋  | 127/166 [00:01<00:00, 97.22it/s]
 84%|████████▍ | 140/166 [00:01<00:00, 104.22it/s]
 92%|█████████▏| 153/166 [00:01<00:00, 108.21it/s]
100%|██████████| 166/166 [00:01<00:00, 104.94it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 347.26it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 12/166 [00:00<00:01, 113.92it/s]
 14%|█▍        | 24/166 [00:00<00:01, 102.06it/s]
 21%|██        | 35/166 [00

[2m[36m(func pid=14656)[0m Epoch 00121: reducing learning rate of group 0 to 4.0352e-05.


  7%|▋         | 12/166 [00:00<00:01, 117.50it/s]
 14%|█▍        | 24/166 [00:00<00:01, 102.06it/s]
 21%|██        | 35/166 [00:00<00:01, 97.64it/s] 
 28%|██▊       | 46/166 [00:00<00:01, 101.43it/s]
 34%|███▍      | 57/166 [00:00<00:01, 98.11it/s] 
 40%|████      | 67/166 [00:00<00:01, 93.41it/s]
 47%|████▋     | 78/166 [00:00<00:00, 96.65it/s]
 54%|█████▍    | 90/166 [00:00<00:00, 101.20it/s]
 61%|██████▏   | 102/166 [00:01<00:00, 104.67it/s]
 69%|██████▊   | 114/166 [00:01<00:00, 106.90it/s]
 77%|███████▋  | 127/166 [00:01<00:00, 111.10it/s]
 84%|████████▎ | 139/166 [00:01<00:00, 112.65it/s]
 91%|█████████ | 151/166 [00:01<00:00, 112.85it/s]
100%|██████████| 48/48 [00:00<00:00, 353.66it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  6%|▌         | 10/166 [00:00<00:01, 99.53it/s]
 13%|█▎        | 21/166 [00:00<00:01, 104.74it/s]
 19%|█▉        | 32/166 [00:00<00:01, 100.25it/s]
 26%|██▌       | 43/166 [00:00<00:01, 102.32it/s]
 33%|███▎      | 54/166 [00:00<00:01, 101.59it/s]
 39%|███▉

[2m[36m(func pid=14656)[0m Epoch 00127: reducing learning rate of group 0 to 2.0176e-05.


  7%|▋         | 12/166 [00:00<00:01, 113.98it/s]
 14%|█▍        | 24/166 [00:00<00:01, 101.68it/s]
 28%|██▊       | 46/166 [00:00<00:01, 106.14it/s]
 34%|███▍      | 57/166 [00:00<00:01, 103.50it/s]
 41%|████      | 68/166 [00:00<00:00, 102.04it/s]
 49%|████▉     | 81/166 [00:00<00:00, 109.25it/s]
 57%|█████▋    | 94/166 [00:00<00:00, 114.57it/s]
 64%|██████▍   | 107/166 [00:00<00:00, 118.11it/s]
 72%|███████▏  | 120/166 [00:01<00:00, 119.63it/s]
 80%|████████  | 133/166 [00:01<00:00, 119.32it/s]
 88%|████████▊ | 146/166 [00:01<00:00, 119.66it/s]
 96%|█████████▌| 159/166 [00:01<00:00, 120.77it/s]
100%|██████████| 166/166 [00:01<00:00, 114.12it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 371.37it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  6%|▌         | 10/166 [00:00<00:01, 98.05it/s]
 13%|█▎        | 22/166 [00:00<00:01, 106.20it/s]
 20%|█▉        | 33/166 [00:00<00:01, 102.23it/s]
 28%|██▊       | 46/166 [00:00<00:01, 110.18it/s]
 35%|███▍      | 

[2m[36m(func pid=14656)[0m Epoch 00133: reducing learning rate of group 0 to 1.0088e-05.


  7%|▋         | 11/166 [00:00<00:01, 106.69it/s]
 13%|█▎        | 22/166 [00:00<00:01, 91.66it/s] 
 19%|█▉        | 32/166 [00:00<00:01, 94.71it/s]
 25%|██▌       | 42/166 [00:00<00:01, 94.87it/s]
 33%|███▎      | 55/166 [00:00<00:01, 104.61it/s]
 40%|███▉      | 66/166 [00:00<00:01, 97.72it/s] 
 48%|████▊     | 80/166 [00:00<00:00, 106.74it/s]
 55%|█████▍    | 91/166 [00:00<00:00, 106.35it/s]
 63%|██████▎   | 104/166 [00:00<00:00, 112.28it/s]
 70%|██████▉   | 116/166 [00:01<00:00, 112.99it/s]
 78%|███████▊  | 129/166 [00:01<00:00, 116.13it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 408.41it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 106.62it/s]
 13%|█▎        | 22/166 [00:00<00:01, 107.32it/s]
 20%|█▉        | 33/166 [00:00<00:01, 101.92it/s]
 27%|██▋       | 45/166 [00:00<00:01, 107.24it/s]
 34%|███▎      | 56/166 [00:00<00:01, 97.96it/s] 
 41%|████      | 68/166 [00:00<00:00, 103.03it/s]
 57%|█████▋    | 94/1

[2m[36m(func pid=14656)[0m Epoch 00139: reducing learning rate of group 0 to 5.0440e-06.


 22%|██▏       | 36/166 [00:00<00:01, 107.89it/s]
 28%|██▊       | 47/166 [00:00<00:01, 101.34it/s]
 35%|███▍      | 58/166 [00:00<00:01, 103.09it/s]
 42%|████▏     | 69/166 [00:00<00:00, 97.11it/s] 
 49%|████▉     | 82/166 [00:00<00:00, 105.39it/s]
 57%|█████▋    | 95/166 [00:00<00:00, 110.31it/s]
 65%|██████▌   | 108/166 [00:01<00:00, 113.72it/s]
 80%|████████  | 133/166 [00:01<00:00, 116.81it/s]
 88%|████████▊ | 146/166 [00:01<00:00, 118.21it/s]
 95%|█████████▌| 158/166 [00:01<00:00, 116.93it/s]
100%|██████████| 166/166 [00:01<00:00, 111.30it/s]
  0%|          | 0/48 [00:00<?, ?it/s]
100%|██████████| 48/48 [00:00<00:00, 393.64it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  6%|▌         | 10/166 [00:00<00:01, 99.49it/s]
 13%|█▎        | 21/166 [00:00<00:01, 98.80it/s]
 19%|█▊        | 31/166 [00:00<00:01, 97.16it/s]
 25%|██▌       | 42/166 [00:00<00:01, 101.19it/s]
 32%|███▏      | 53/166 [00:00<00:01, 95.91it/s] 
 39%|███▉      | 65/166 [00:00<00:00, 101.29it/s]
 47%|████▋     | 78/

[2m[36m(func pid=14656)[0m Epoch 00145: reducing learning rate of group 0 to 2.5220e-06.


  0%|          | 0/166 [00:00<?, ?it/s]
  6%|▌         | 10/166 [00:00<00:01, 92.12it/s]
 12%|█▏        | 20/166 [00:00<00:01, 83.22it/s]
 19%|█▊        | 31/166 [00:00<00:01, 90.94it/s]
 25%|██▍       | 41/166 [00:00<00:01, 90.60it/s]
 37%|███▋      | 61/166 [00:00<00:01, 92.44it/s]
 45%|████▍     | 74/166 [00:00<00:00, 103.62it/s]
 52%|█████▏    | 87/166 [00:00<00:00, 111.63it/s]
 60%|██████    | 100/166 [00:00<00:00, 114.80it/s]
 67%|██████▋   | 112/166 [00:01<00:00, 116.31it/s]
 75%|███████▍  | 124/166 [00:01<00:00, 116.08it/s]
 82%|████████▏ | 136/166 [00:01<00:00, 115.80it/s]
 89%|████████▉ | 148/166 [00:01<00:00, 111.44it/s]
 96%|█████████▋| 160/166 [00:01<00:00, 112.29it/s]
 75%|███████▌  | 36/48 [00:00<00:00, 358.02it/s]
100%|██████████| 48/48 [00:00<00:00, 360.62it/s]
  0%|          | 0/166 [00:00<?, ?it/s]
  7%|▋         | 11/166 [00:00<00:01, 106.79it/s]
 13%|█▎        | 22/166 [00:00<00:01, 90.30it/s] 
 19%|█▉        | 32/166 [00:00<00:01, 87.94it/s]
 25%|██▍       | 41/16

[2m[36m(func pid=17508)[0m Epoch 00047: reducing learning rate of group 0 to 6.7248e-05.


 28%|██▊       | 38/138 [00:00<00:00, 185.33it/s]
 41%|████▏     | 57/138 [00:00<00:00, 185.95it/s]
 56%|█████▌    | 77/138 [00:00<00:00, 188.21it/s]
 70%|██████▉   | 96/138 [00:00<00:00, 186.25it/s]
 83%|████████▎ | 115/138 [00:00<00:00, 185.66it/s]
100%|██████████| 40/40 [00:00<00:00, 511.41it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 177.12it/s]
 26%|██▌       | 36/138 [00:00<00:00, 159.73it/s]
 38%|███▊      | 53/138 [00:00<00:00, 153.58it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 160.88it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 152.68it/s]
 88%|████████▊ | 121/138 [00:00<00:00, 153.26it/s]
100%|██████████| 138/138 [00:00<00:00, 155.93it/s]
100%|██████████| 40/40 [00:00<00:00, 494.66it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 155.76it/s]
 36%|███▌      | 50/138 [00:00<00:00, 163.75it/s]
 49%|████▉     | 68/138 [00:00<00:00, 167.03it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 177.27it/s]
 78%|███████▊  | 1

[2m[36m(func pid=17508)[0m Epoch 00059: reducing learning rate of group 0 to 3.3624e-05.


 13%|█▎        | 18/138 [00:00<00:00, 176.09it/s]
 26%|██▌       | 36/138 [00:00<00:00, 170.53it/s]
 39%|███▉      | 54/138 [00:00<00:00, 174.44it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 176.59it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 174.24it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 219.51it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 11%|█         | 15/138 [00:00<00:00, 144.01it/s]
 25%|██▍       | 34/138 [00:00<00:00, 164.74it/s]
 50%|█████     | 69/138 [00:00<00:00, 163.21it/s]
 62%|██████▏   | 86/138 [00:00<00:00, 151.64it/s]
 75%|███████▌  | 104/138 [00:00<00:00, 160.14it/s]
 90%|████████▉ | 124/138 [00:00<00:00, 170.94it/s]
100%|██████████| 138/138 [00:00<00:00, 165.46it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 524.02it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 19/138 [00:00<00:00, 189.01it/s]
 28%|██▊       | 38/138 [00:00<00:00, 186.96it/s]
 42%|████▏     | 58/138 [00:00<00:00, 191

[2m[36m(func pid=17508)[0m Epoch 00068: reducing learning rate of group 0 to 1.6812e-05.


 13%|█▎        | 18/138 [00:00<00:00, 171.75it/s]
 26%|██▌       | 36/138 [00:00<00:00, 174.15it/s]
 39%|███▉      | 54/138 [00:00<00:00, 162.39it/s]
 53%|█████▎    | 73/138 [00:00<00:00, 171.84it/s]
 66%|██████▌   | 91/138 [00:00<00:00, 158.31it/s]
 78%|███████▊  | 108/138 [00:00<00:00, 149.90it/s]
 91%|█████████▏| 126/138 [00:00<00:00, 156.78it/s]
100%|██████████| 138/138 [00:00<00:00, 159.57it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 510.13it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 172.50it/s]
 26%|██▌       | 36/138 [00:00<00:00, 170.01it/s]
 39%|███▉      | 54/138 [00:00<00:00, 172.41it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 161.41it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 162.64it/s]
 77%|███████▋  | 106/138 [00:00<00:00, 163.85it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 449.97it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 19/138 [00:00<00:00, 18

[2m[36m(func pid=17508)[0m Epoch 00074: reducing learning rate of group 0 to 8.4061e-06.


  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 158.38it/s]
 36%|███▌      | 50/138 [00:00<00:00, 162.32it/s]
 49%|████▉     | 68/138 [00:00<00:00, 168.34it/s]
 62%|██████▏   | 85/138 [00:00<00:00, 167.22it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 178.13it/s]
 91%|█████████ | 125/138 [00:00<00:00, 183.44it/s]
100%|██████████| 40/40 [00:00<00:00, 465.10it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
  9%|▊         | 12/138 [00:00<00:01, 118.40it/s]
 20%|██        | 28/138 [00:00<00:00, 138.75it/s]
 30%|███       | 42/138 [00:00<00:00, 135.59it/s]
 42%|████▏     | 58/138 [00:00<00:00, 144.96it/s]
 53%|█████▎    | 73/138 [00:00<00:00, 137.07it/s]
 63%|██████▎   | 87/138 [00:00<00:00, 126.30it/s]
 73%|███████▎  | 101/138 [00:00<00:00, 128.35it/s]
 83%|████████▎ | 115/138 [00:00<00:00, 130.99it/s]
100%|██████████| 138/138 [00:01<00:00, 134.84it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 476.69it/s]
  0%|          | 0/138 [00:0

[2m[36m(func pid=17508)[0m Epoch 00081: reducing learning rate of group 0 to 4.2030e-06.


 13%|█▎        | 18/138 [00:00<00:00, 178.03it/s]
 27%|██▋       | 37/138 [00:00<00:00, 177.91it/s]
 40%|███▉      | 55/138 [00:00<00:00, 172.62it/s]
 53%|█████▎    | 73/138 [00:00<00:00, 165.36it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 162.56it/s]
 80%|███████▉  | 110/138 [00:00<00:00, 173.97it/s]
100%|██████████| 138/138 [00:00<00:00, 174.73it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 556.14it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 20/138 [00:00<00:00, 192.10it/s]
 29%|██▉       | 40/138 [00:00<00:00, 193.66it/s]
 43%|████▎     | 60/138 [00:00<00:00, 189.78it/s]
 57%|█████▋    | 79/138 [00:00<00:00, 189.73it/s]
 85%|████████▍ | 117/138 [00:00<00:00, 187.96it/s]
100%|██████████| 40/40 [00:00<00:00, 539.41it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 10%|█         | 14/138 [00:00<00:00, 138.86it/s]
 22%|██▏       | 30/138 [00:00<00:00, 151.04it/s]
 33%|███▎      | 46/138 [00:00<00:00, 144.10it/s]
 45%|████▍     | 62/138 [00:00

[2m[36m(func pid=17508)[0m Epoch 00087: reducing learning rate of group 0 to 2.1015e-06.


 14%|█▍        | 19/138 [00:00<00:00, 188.52it/s]
 28%|██▊       | 39/138 [00:00<00:00, 190.64it/s]
 43%|████▎     | 59/138 [00:00<00:00, 185.81it/s]
 57%|█████▋    | 78/138 [00:00<00:00, 181.11it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 527.48it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 156.87it/s]
 25%|██▌       | 35/138 [00:00<00:00, 172.48it/s]
 38%|███▊      | 53/138 [00:00<00:00, 157.30it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 163.92it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 149.26it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 156.89it/s]
100%|██████████| 138/138 [00:00<00:00, 160.67it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 419.56it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 164.46it/s]
 26%|██▌       | 36/138 [00:00<00:00, 174.38it/s]
 39%|███▉      | 54/138 [00:00<00:00, 168.67it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 169

[2m[36m(func pid=17508)[0m Epoch 00093: reducing learning rate of group 0 to 1.0508e-06.


 11%|█         | 15/138 [00:00<00:00, 147.53it/s]
 25%|██▍       | 34/138 [00:00<00:00, 172.24it/s]
 38%|███▊      | 52/138 [00:00<00:00, 160.52it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 168.83it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 159.25it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 148.31it/s]
 88%|████████▊ | 122/138 [00:00<00:00, 153.32it/s]
100%|██████████| 138/138 [00:00<00:00, 158.45it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 531.53it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 19/138 [00:00<00:00, 187.31it/s]
 28%|██▊       | 38/138 [00:00<00:00, 179.35it/s]
 41%|████      | 56/138 [00:00<00:00, 174.16it/s]
 54%|█████▎    | 74/138 [00:00<00:00, 174.52it/s]
 67%|██████▋   | 92/138 [00:00<00:00, 174.62it/s]
 81%|████████  | 112/138 [00:00<00:00, 179.43it/s]
 96%|█████████▌| 132/138 [00:00<00:00, 184.18it/s]
100%|██████████| 138/138 [00:00<00:00, 179.73it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:

[2m[36m(func pid=17508)[0m Epoch 00099: reducing learning rate of group 0 to 5.2538e-07.


 12%|█▏        | 17/138 [00:00<00:00, 168.20it/s]
 25%|██▌       | 35/138 [00:00<00:00, 172.75it/s]
 39%|███▉      | 54/138 [00:00<00:00, 176.13it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 169.58it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 169.10it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 517.83it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 159.78it/s]
 25%|██▍       | 34/138 [00:00<00:00, 166.99it/s]
 37%|███▋      | 51/138 [00:00<00:00, 163.10it/s]
 49%|████▉     | 68/138 [00:00<00:00, 159.64it/s]
 62%|██████▏   | 86/138 [00:00<00:00, 162.18it/s]
 75%|███████▍  | 103/138 [00:00<00:00, 158.11it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 170.07it/s]
100%|██████████| 138/138 [00:00<00:00, 165.89it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 571.62it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 20/138 [00:00<00:00, 190.93it/s]
 29%|██▉       | 40/138 [00:00<00:00, 189

[2m[36m(func pid=17508)[0m Epoch 00105: reducing learning rate of group 0 to 2.6269e-07.


 12%|█▏        | 16/138 [00:00<00:00, 156.92it/s]
 36%|███▌      | 50/138 [00:00<00:00, 132.18it/s]
 49%|████▉     | 68/138 [00:00<00:00, 146.09it/s]
 61%|██████    | 84/138 [00:00<00:00, 140.85it/s]
 75%|███████▌  | 104/138 [00:00<00:00, 156.52it/s]
100%|██████████| 138/138 [00:00<00:00, 155.26it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 556.89it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 171.05it/s]
 26%|██▌       | 36/138 [00:00<00:00, 174.24it/s]
 54%|█████▎    | 74/138 [00:00<00:00, 178.93it/s]
 67%|██████▋   | 93/138 [00:00<00:00, 180.19it/s]
 81%|████████  | 112/138 [00:00<00:00, 180.44it/s]
100%|██████████| 138/138 [00:00<00:00, 182.09it/s]
100%|██████████| 40/40 [00:00<00:00, 570.35it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 14%|█▍        | 19/138 [00:00<00:00, 187.74it/s]
 28%|██▊       | 39/138 [00:00<00:00, 191.78it/s]
 43%|████▎     | 59/138 [00:00<00:00, 192.10it/s]
 57%|█████▋    | 79/138 [00:0

[2m[36m(func pid=17508)[0m Epoch 00111: reducing learning rate of group 0 to 1.3134e-07.


 28%|██▊       | 38/138 [00:00<00:00, 183.95it/s]
 41%|████▏     | 57/138 [00:00<00:00, 174.06it/s]
 54%|█████▍    | 75/138 [00:00<00:00, 174.14it/s]
 67%|██████▋   | 93/138 [00:00<00:00, 172.18it/s]
 80%|████████  | 111/138 [00:00<00:00, 174.24it/s]
100%|██████████| 138/138 [00:00<00:00, 159.66it/s]
100%|██████████| 40/40 [00:00<00:00, 524.91it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 169.79it/s]
 26%|██▌       | 36/138 [00:00<00:00, 172.63it/s]
 54%|█████▎    | 74/138 [00:00<00:00, 183.42it/s]
 68%|██████▊   | 94/138 [00:00<00:00, 186.68it/s]
 82%|████████▏ | 113/138 [00:00<00:00, 187.77it/s]
100%|██████████| 40/40 [00:00<00:00, 479.83it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 163.87it/s]
 25%|██▍       | 34/138 [00:00<00:00, 163.57it/s]
 38%|███▊      | 52/138 [00:00<00:00, 169.19it/s]
 50%|█████     | 69/138 [00:00<00:00, 156.26it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 165.00it/s]
 76%|███████▌  | 10

[2m[36m(func pid=17508)[0m Epoch 00117: reducing learning rate of group 0 to 6.5672e-08.


 28%|██▊       | 39/138 [00:00<00:00, 193.23it/s]
 43%|████▎     | 59/138 [00:00<00:00, 193.63it/s]
 57%|█████▋    | 79/138 [00:00<00:00, 194.76it/s]
 72%|███████▏  | 99/138 [00:00<00:00, 195.26it/s]
 86%|████████▌ | 119/138 [00:00<00:00, 194.87it/s]
100%|██████████| 138/138 [00:00<00:00, 193.69it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 550.79it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 11%|█         | 15/138 [00:00<00:00, 149.06it/s]
 33%|███▎      | 46/138 [00:00<00:00, 122.45it/s]
 46%|████▋     | 64/138 [00:00<00:00, 141.22it/s]
 57%|█████▋    | 79/138 [00:00<00:00, 141.26it/s]
 70%|███████   | 97/138 [00:00<00:00, 151.95it/s]
 83%|████████▎ | 115/138 [00:00<00:00, 159.51it/s]
100%|██████████| 138/138 [00:00<00:00, 148.92it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 499.62it/s]
 13%|█▎        | 18/138 [00:00<00:00, 177.40it/s]
 26%|██▌       | 36/138 [00:00<00:00, 178.88it/s]
 40%|███▉      | 55/138 [00:00

[2m[36m(func pid=17508)[0m Epoch 00123: reducing learning rate of group 0 to 3.2836e-08.


 13%|█▎        | 18/138 [00:00<00:00, 171.47it/s]
 26%|██▌       | 36/138 [00:00<00:00, 160.93it/s]
 38%|███▊      | 53/138 [00:00<00:00, 164.69it/s]
 51%|█████     | 70/138 [00:00<00:00, 157.95it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 161.40it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 147.09it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 154.48it/s]
100%|██████████| 138/138 [00:00<00:00, 158.87it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 555.95it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 172.39it/s]
 26%|██▌       | 36/138 [00:00<00:00, 173.15it/s]
 40%|███▉      | 55/138 [00:00<00:00, 176.42it/s]
 53%|█████▎    | 73/138 [00:00<00:00, 175.04it/s]
 66%|██████▌   | 91/138 [00:00<00:00, 174.37it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 175.69it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 496.24it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 15

[2m[36m(func pid=17508)[0m Epoch 00129: reducing learning rate of group 0 to 1.6418e-08.


 25%|██▌       | 35/138 [00:00<00:00, 170.85it/s]
 38%|███▊      | 53/138 [00:00<00:00, 173.33it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 171.38it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 176.55it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 180.43it/s]
 93%|█████████▎| 129/138 [00:00<00:00, 184.61it/s]
100%|██████████| 138/138 [00:00<00:00, 179.85it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 536.46it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 168.44it/s]
 25%|██▍       | 34/138 [00:00<00:00, 165.74it/s]
 37%|███▋      | 51/138 [00:00<00:00, 158.73it/s]
 49%|████▊     | 67/138 [00:00<00:00, 154.88it/s]
 62%|██████▏   | 85/138 [00:00<00:00, 160.76it/s]
 74%|███████▍  | 102/138 [00:00<00:00, 154.18it/s]
 88%|████████▊ | 122/138 [00:00<00:00, 166.72it/s]
100%|██████████| 138/138 [00:00<00:00, 165.41it/s]
100%|██████████| 40/40 [00:00<00:00, 563.03it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00

[2m[36m(func pid=7648)[0m Epoch 00055: reducing learning rate of group 0 to 7.5261e-05.


  6%|▌         | 17/276 [00:00<00:01, 161.64it/s]
 19%|█▉        | 52/276 [00:00<00:01, 163.46it/s]
 25%|██▌       | 69/276 [00:00<00:01, 156.00it/s]
 31%|███       | 85/276 [00:00<00:01, 157.20it/s]
 37%|███▋      | 101/276 [00:00<00:01, 144.50it/s]
 43%|████▎     | 119/276 [00:00<00:01, 154.33it/s]
 57%|█████▋    | 156/276 [00:00<00:00, 168.90it/s]
 63%|██████▎   | 175/276 [00:01<00:00, 174.60it/s]
 70%|███████   | 194/276 [00:01<00:00, 178.32it/s]
 77%|███████▋  | 213/276 [00:01<00:00, 178.95it/s]
 84%|████████▍ | 232/276 [00:01<00:00, 181.12it/s]
 91%|█████████ | 251/276 [00:01<00:00, 183.22it/s]
100%|██████████| 276/276 [00:01<00:00, 170.43it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
 92%|█████████▏| 73/79 [00:00<00:00, 712.33it/s]
100%|██████████| 79/79 [00:00<00:00, 716.26it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 19/276 [00:00<00:01, 187.60it/s]
 14%|█▍        | 38/276 [00:00<00:01, 187.03it/s]
 21%|██        | 57/276 [00:00<00:01, 187.41it/s]
 28%|██▊      

[2m[36m(func pid=7648)[0m Epoch 00061: reducing learning rate of group 0 to 3.7630e-05.


 12%|█▏        | 34/276 [00:00<00:01, 162.85it/s]
 18%|█▊        | 51/276 [00:00<00:01, 164.24it/s]
 25%|██▌       | 70/276 [00:00<00:01, 173.19it/s]
 38%|███▊      | 105/276 [00:00<00:01, 157.26it/s]
 45%|████▍     | 123/276 [00:00<00:00, 163.14it/s]
 52%|█████▏    | 144/276 [00:00<00:00, 175.78it/s]
 59%|█████▉    | 164/276 [00:00<00:00, 182.83it/s]
 75%|███████▍  | 206/276 [00:01<00:00, 192.24it/s]
 82%|████████▏ | 227/276 [00:01<00:00, 197.30it/s]
 90%|████████▉ | 248/276 [00:01<00:00, 199.96it/s]
100%|██████████| 276/276 [00:01<00:00, 183.15it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 693.25it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 20/276 [00:00<00:01, 191.72it/s]
 14%|█▍        | 40/276 [00:00<00:01, 194.92it/s]
 22%|██▏       | 61/276 [00:00<00:01, 199.17it/s]
 30%|██▉       | 82/276 [00:00<00:00, 202.26it/s]
 37%|███▋      | 103/276 [00:00<00:00, 200.75it/s]
 45%|████▍     | 124/276 [00:00<00:00, 200.14it/s]
 53%|█████▎ 

[2m[36m(func pid=7648)[0m Epoch 00069: reducing learning rate of group 0 to 1.8815e-05.


 12%|█▏        | 32/276 [00:00<00:01, 156.05it/s]
 17%|█▋        | 48/276 [00:00<00:01, 157.13it/s]
 24%|██▎       | 65/276 [00:00<00:01, 161.68it/s]
 30%|███       | 84/276 [00:00<00:01, 169.35it/s]
 37%|███▋      | 101/276 [00:00<00:01, 150.86it/s]
 43%|████▎     | 119/276 [00:00<00:00, 157.87it/s]
 51%|█████     | 140/276 [00:00<00:00, 171.72it/s]
 58%|█████▊    | 161/276 [00:00<00:00, 180.70it/s]
 66%|██████▌   | 182/276 [00:01<00:00, 187.18it/s]
 74%|███████▎  | 203/276 [00:01<00:00, 192.12it/s]
 81%|████████  | 224/276 [00:01<00:00, 195.59it/s]
 88%|████████▊ | 244/276 [00:01<00:00, 195.86it/s]
 77%|███████▋  | 61/79 [00:00<00:00, 603.02it/s]
100%|██████████| 79/79 [00:00<00:00, 623.56it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  6%|▌         | 16/276 [00:00<00:01, 157.41it/s]
 13%|█▎        | 35/276 [00:00<00:01, 171.74it/s]
 19%|█▉        | 53/276 [00:00<00:01, 166.91it/s]
 25%|██▌       | 70/276 [00:00<00:01, 165.70it/s]
 32%|███▏      | 88/276 [00:00<00:01, 168.14it/s]
 38%

[2m[36m(func pid=7648)[0m Epoch 00075: reducing learning rate of group 0 to 9.4076e-06.


  8%|▊         | 21/276 [00:00<00:01, 200.78it/s]
 22%|██▏       | 61/276 [00:00<00:01, 181.16it/s]
 29%|██▉       | 80/276 [00:00<00:01, 173.67it/s]
 36%|███▌      | 100/276 [00:00<00:00, 179.96it/s]
 43%|████▎     | 119/276 [00:00<00:00, 168.53it/s]
 50%|████▉     | 137/276 [00:00<00:00, 170.25it/s]
 63%|██████▎   | 174/276 [00:00<00:00, 173.86it/s]
 71%|███████   | 195/276 [00:01<00:00, 182.89it/s]
 78%|███████▊  | 216/276 [00:01<00:00, 189.35it/s]
 86%|████████▌ | 237/276 [00:01<00:00, 193.65it/s]
 93%|█████████▎| 257/276 [00:01<00:00, 193.69it/s]
100%|██████████| 276/276 [00:01<00:00, 183.75it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 663.50it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
 14%|█▍        | 40/276 [00:00<00:01, 181.88it/s]
 21%|██▏       | 59/276 [00:00<00:01, 180.69it/s]
 28%|██▊       | 78/276 [00:00<00:01, 182.64it/s]
 35%|███▌      | 97/276 [00:00<00:01, 172.65it/s]
 42%|████▏     | 117/276 [00:00<00:00, 178.52it/s]
 50%|████▉  

[2m[36m(func pid=7648)[0m Epoch 00085: reducing learning rate of group 0 to 4.7038e-06.


 13%|█▎        | 36/276 [00:00<00:01, 157.93it/s]
 19%|█▉        | 53/276 [00:00<00:01, 159.59it/s]
 25%|██▌       | 70/276 [00:00<00:01, 151.61it/s]
 32%|███▏      | 88/276 [00:00<00:01, 157.24it/s]
 38%|███▊      | 104/276 [00:00<00:01, 143.32it/s]
 45%|████▍     | 123/276 [00:00<00:00, 155.40it/s]
 51%|█████▏    | 142/276 [00:00<00:00, 163.46it/s]
 58%|█████▊    | 160/276 [00:01<00:00, 166.63it/s]
 64%|██████▍   | 177/276 [00:01<00:00, 167.49it/s]
 71%|███████   | 195/276 [00:01<00:00, 169.61it/s]
 78%|███████▊  | 215/276 [00:01<00:00, 176.47it/s]
 84%|████████▍ | 233/276 [00:01<00:00, 176.79it/s]
 91%|█████████ | 251/276 [00:01<00:00, 176.98it/s]
100%|██████████| 276/276 [00:01<00:00, 167.55it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 699.86it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 18/276 [00:00<00:01, 179.74it/s]
 13%|█▎        | 36/276 [00:00<00:01, 179.04it/s]
 20%|█▉        | 55/276 [00:00<00:01, 180.91it/s]
 27%|██▋    

[2m[36m(func pid=7648)[0m Epoch 00091: reducing learning rate of group 0 to 2.3519e-06.


  7%|▋         | 18/276 [00:00<00:01, 175.89it/s]
 13%|█▎        | 36/276 [00:00<00:01, 157.65it/s]
 20%|█▉        | 54/276 [00:00<00:01, 165.59it/s]
 26%|██▌       | 71/276 [00:00<00:01, 163.18it/s]
 32%|███▏      | 89/276 [00:00<00:01, 168.21it/s]
 39%|███▉      | 107/276 [00:00<00:00, 171.45it/s]
 46%|████▌     | 126/276 [00:00<00:00, 175.66it/s]
 60%|█████▉    | 165/276 [00:00<00:00, 182.30it/s]
 67%|██████▋   | 185/276 [00:01<00:00, 184.41it/s]
 74%|███████▍  | 205/276 [00:01<00:00, 187.71it/s]
 82%|████████▏ | 226/276 [00:01<00:00, 193.17it/s]
 89%|████████▉ | 246/276 [00:01<00:00, 194.62it/s]
100%|██████████| 276/276 [00:01<00:00, 179.71it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 754.02it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 20/276 [00:00<00:01, 190.92it/s]
 14%|█▍        | 40/276 [00:00<00:01, 191.72it/s]
 29%|██▉       | 80/276 [00:00<00:01, 194.34it/s]
 37%|███▋      | 101/276 [00:00<00:00, 196.70it/s]
 44%|████▍   

[2m[36m(func pid=7648)[0m Epoch 00097: reducing learning rate of group 0 to 1.1760e-06.


  7%|▋         | 20/276 [00:00<00:01, 193.17it/s]
 14%|█▍        | 40/276 [00:00<00:01, 156.64it/s]
 21%|██        | 57/276 [00:00<00:01, 150.43it/s]
 26%|██▋       | 73/276 [00:00<00:01, 151.70it/s]
 32%|███▏      | 89/276 [00:00<00:01, 139.06it/s]
 38%|███▊      | 106/276 [00:00<00:01, 146.83it/s]
 45%|████▍     | 124/276 [00:00<00:00, 154.46it/s]
 52%|█████▏    | 143/276 [00:00<00:00, 163.57it/s]
 58%|█████▊    | 160/276 [00:01<00:00, 164.55it/s]
 65%|██████▌   | 180/276 [00:01<00:00, 172.55it/s]
 72%|███████▏  | 198/276 [00:01<00:00, 173.19it/s]
 79%|███████▉  | 218/276 [00:01<00:00, 178.99it/s]
 93%|█████████▎| 257/276 [00:01<00:00, 185.01it/s]
100%|██████████| 276/276 [00:01<00:00, 168.97it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 758.34it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 19/276 [00:00<00:01, 187.36it/s]
 14%|█▍        | 40/276 [00:00<00:01, 196.94it/s]
 30%|██▉       | 82/276 [00:00<00:00, 201.85it/s]
 37%|███▋    

[2m[36m(func pid=7648)[0m Epoch 00105: reducing learning rate of group 0 to 5.8798e-07.


  5%|▌         | 15/276 [00:00<00:01, 147.06it/s]
 13%|█▎        | 35/276 [00:00<00:01, 175.02it/s]
 20%|█▉        | 54/276 [00:00<00:01, 175.97it/s]
 26%|██▋       | 73/276 [00:00<00:01, 179.41it/s]
 33%|███▎      | 91/276 [00:00<00:01, 170.17it/s]
 39%|███▉      | 109/276 [00:00<00:00, 167.89it/s]
 46%|████▌     | 126/276 [00:00<00:00, 167.32it/s]
 53%|█████▎    | 146/276 [00:00<00:00, 176.36it/s]
 60%|██████    | 166/276 [00:00<00:00, 181.81it/s]
 68%|██████▊   | 187/276 [00:01<00:00, 187.75it/s]
 75%|███████▌  | 207/276 [00:01<00:00, 191.04it/s]
 82%|████████▏ | 227/276 [00:01<00:00, 192.79it/s]
 90%|████████▉ | 248/276 [00:01<00:00, 195.67it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 735.21it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 19/276 [00:00<00:01, 179.28it/s]
 13%|█▎        | 37/276 [00:00<00:01, 170.12it/s]
 20%|█▉        | 55/276 [00:00<00:01, 169.22it/s]
 27%|██▋       | 75/276 [00:00<00:01, 180.72it/s]
 34%|███▍     

[2m[36m(func pid=7648)[0m Epoch 00115: reducing learning rate of group 0 to 2.9399e-07.


  6%|▌         | 17/276 [00:00<00:01, 168.22it/s]
 12%|█▏        | 34/276 [00:00<00:01, 148.63it/s]
 26%|██▌       | 71/276 [00:00<00:01, 170.76it/s]
 32%|███▏      | 89/276 [00:00<00:01, 162.51it/s]
 39%|███▉      | 109/276 [00:00<00:00, 174.03it/s]
 46%|████▋     | 128/276 [00:00<00:00, 177.29it/s]
 54%|█████▍    | 149/276 [00:00<00:00, 184.66it/s]
 68%|██████▊   | 189/276 [00:01<00:00, 189.56it/s]
 76%|███████▌  | 209/276 [00:01<00:00, 190.67it/s]
 83%|████████▎ | 229/276 [00:01<00:00, 193.35it/s]
 90%|█████████ | 249/276 [00:01<00:00, 194.43it/s]
100%|██████████| 276/276 [00:01<00:00, 182.54it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
 96%|█████████▌| 76/79 [00:00<00:00, 753.75it/s]
100%|██████████| 79/79 [00:00<00:00, 743.48it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 19/276 [00:00<00:01, 186.17it/s]
 14%|█▍        | 40/276 [00:00<00:01, 196.77it/s]
 22%|██▏       | 60/276 [00:00<00:01, 194.73it/s]
 29%|██▉       | 80/276 [00:00<00:01, 187.54it/s]
 36%|███▌      

[2m[36m(func pid=7648)[0m Epoch 00121: reducing learning rate of group 0 to 1.4699e-07.


  7%|▋         | 20/276 [00:00<00:01, 196.00it/s]
 14%|█▍        | 40/276 [00:00<00:01, 160.77it/s]
 21%|██        | 57/276 [00:00<00:01, 151.07it/s]
 26%|██▋       | 73/276 [00:00<00:01, 137.52it/s]
 32%|███▏      | 88/276 [00:00<00:01, 139.23it/s]
 37%|███▋      | 103/276 [00:00<00:01, 131.51it/s]
 43%|████▎     | 120/276 [00:00<00:01, 141.99it/s]
 51%|█████     | 140/276 [00:00<00:00, 158.64it/s]
 57%|█████▋    | 158/276 [00:01<00:00, 163.74it/s]
 64%|██████▍   | 177/276 [00:01<00:00, 169.52it/s]
 71%|███████   | 195/276 [00:01<00:00, 166.89it/s]
 78%|███████▊  | 214/276 [00:01<00:00, 173.51it/s]
 85%|████████▍ | 234/276 [00:01<00:00, 179.14it/s]
 92%|█████████▏| 254/276 [00:01<00:00, 185.12it/s]
100%|██████████| 276/276 [00:01<00:00, 164.97it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 683.64it/s]
  7%|▋         | 19/276 [00:00<00:01, 182.95it/s]
 14%|█▍        | 38/276 [00:00<00:01, 178.79it/s]
 20%|██        | 56/276 [00:00<00:01, 179.21it/s]
 2

[2m[36m(func pid=7648)[0m Epoch 00127: reducing learning rate of group 0 to 7.3497e-08.


  6%|▌         | 17/276 [00:00<00:01, 166.66it/s]
 12%|█▏        | 34/276 [00:00<00:01, 143.37it/s]
 18%|█▊        | 51/276 [00:00<00:01, 152.07it/s]
 25%|██▌       | 69/276 [00:00<00:01, 160.99it/s]
 31%|███       | 86/276 [00:00<00:01, 147.56it/s]
 37%|███▋      | 102/276 [00:00<00:01, 149.51it/s]
 44%|████▍     | 122/276 [00:00<00:00, 161.95it/s]
 51%|█████     | 141/276 [00:00<00:00, 166.07it/s]
 63%|██████▎   | 175/276 [00:01<00:00, 162.15it/s]
 70%|██████▉   | 192/276 [00:01<00:00, 162.49it/s]
 76%|███████▌  | 210/276 [00:01<00:00, 166.18it/s]
 82%|████████▏ | 227/276 [00:01<00:00, 155.01it/s]
 88%|████████▊ | 244/276 [00:01<00:00, 157.12it/s]
100%|██████████| 276/276 [00:01<00:00, 157.29it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 652.16it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  6%|▌         | 17/276 [00:00<00:01, 164.55it/s]
 13%|█▎        | 35/276 [00:00<00:01, 172.61it/s]
 19%|█▉        | 53/276 [00:00<00:01, 172.18it/s]
 26%|██▌     

[2m[36m(func pid=7648)[0m Epoch 00133: reducing learning rate of group 0 to 3.6749e-08.


  7%|▋         | 19/276 [00:00<00:01, 182.84it/s]
 14%|█▍        | 38/276 [00:00<00:01, 166.85it/s]
 20%|██        | 56/276 [00:00<00:01, 171.55it/s]
 27%|██▋       | 74/276 [00:00<00:01, 173.09it/s]
 33%|███▎      | 92/276 [00:00<00:01, 158.29it/s]
 39%|███▉      | 109/276 [00:00<00:01, 144.41it/s]
 46%|████▌     | 126/276 [00:00<00:01, 149.08it/s]
 52%|█████▏    | 144/276 [00:00<00:00, 156.58it/s]
 59%|█████▉    | 164/276 [00:01<00:00, 167.70it/s]
 67%|██████▋   | 184/276 [00:01<00:00, 176.50it/s]
 74%|███████▍  | 205/276 [00:01<00:00, 184.09it/s]
 82%|████████▏ | 225/276 [00:01<00:00, 188.31it/s]
 89%|████████▉ | 246/276 [00:01<00:00, 192.32it/s]
100%|██████████| 276/276 [00:01<00:00, 175.79it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 788.22it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 20/276 [00:00<00:01, 193.80it/s]
 14%|█▍        | 40/276 [00:00<00:01, 195.10it/s]
 22%|██▏       | 61/276 [00:00<00:01, 198.47it/s]
 37%|███▋    

[2m[36m(func pid=7648)[0m Epoch 00143: reducing learning rate of group 0 to 1.8374e-08.


 14%|█▍        | 40/276 [00:00<00:01, 193.49it/s]
 22%|██▏       | 60/276 [00:00<00:01, 185.34it/s]
 29%|██▊       | 79/276 [00:00<00:01, 170.47it/s]
 36%|███▌      | 99/276 [00:00<00:00, 178.55it/s]
 43%|████▎     | 119/276 [00:00<00:00, 182.46it/s]
 50%|█████     | 138/276 [00:00<00:00, 183.00it/s]
 57%|█████▋    | 158/276 [00:00<00:00, 185.89it/s]
 64%|██████▍   | 178/276 [00:00<00:00, 187.03it/s]
 72%|███████▏  | 198/276 [00:01<00:00, 188.90it/s]
 79%|███████▉  | 218/276 [00:01<00:00, 190.53it/s]
 93%|█████████▎| 257/276 [00:01<00:00, 182.08it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 706.69it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  7%|▋         | 18/276 [00:00<00:01, 178.61it/s]
 13%|█▎        | 36/276 [00:00<00:01, 160.33it/s]
 20%|█▉        | 55/276 [00:00<00:01, 169.56it/s]
 26%|██▋       | 73/276 [00:00<00:01, 162.28it/s]
 33%|███▎      | 92/276 [00:00<00:01, 169.37it/s]
 40%|███▉      | 110/276 [00:00<00:00, 167.48it/s]
 47%|████▋    

[2m[36m(func pid=7788)[0m Epoch 00035: reducing learning rate of group 0 to 4.2221e-03.


 10%|█         | 14/138 [00:00<00:00, 139.52it/s]
 32%|███▏      | 44/138 [00:00<00:00, 144.47it/s]
 43%|████▎     | 59/138 [00:00<00:00, 136.07it/s]
 54%|█████▍    | 75/138 [00:00<00:00, 141.29it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 135.74it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 136.86it/s]
 86%|████████▌ | 119/138 [00:00<00:00, 137.73it/s]
 96%|█████████▋| 133/138 [00:00<00:00, 135.92it/s]
100%|██████████| 138/138 [00:01<00:00, 136.67it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 357.53it/s]
 11%|█         | 15/138 [00:00<00:00, 144.14it/s]
 22%|██▏       | 30/138 [00:00<00:00, 118.00it/s]
 42%|████▏     | 58/138 [00:00<00:00, 121.57it/s]
 53%|█████▎    | 73/138 [00:00<00:00, 128.95it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 133.51it/s]
 75%|███████▌  | 104/138 [00:00<00:00, 141.57it/s]
 88%|████████▊ | 121/138 [00:00<00:00, 147.88it/s]
100%|██████████| 138/138 [00:00<00:00, 138.26it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████|

[2m[36m(func pid=7788)[0m Epoch 00056: reducing learning rate of group 0 to 2.1110e-03.


 12%|█▏        | 16/138 [00:00<00:00, 151.14it/s]
 35%|███▍      | 48/138 [00:00<00:00, 147.92it/s]
 46%|████▋     | 64/138 [00:00<00:00, 149.06it/s]
 59%|█████▊    | 81/138 [00:00<00:00, 155.31it/s]
 71%|███████   | 98/138 [00:00<00:00, 159.13it/s]
 83%|████████▎ | 115/138 [00:00<00:00, 162.54it/s]
 96%|█████████▌| 132/138 [00:00<00:00, 164.35it/s]
100%|██████████| 138/138 [00:00<00:00, 158.33it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 417.52it/s]
 12%|█▏        | 17/138 [00:00<00:00, 168.77it/s]
 25%|██▌       | 35/138 [00:00<00:00, 171.22it/s]
 38%|███▊      | 53/138 [00:00<00:00, 172.88it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 172.97it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 172.88it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 172.59it/s]
 91%|█████████ | 125/138 [00:00<00:00, 171.66it/s]
100%|██████████| 138/138 [00:00<00:00, 172.41it/s]
 28%|██▊       | 11/40 [00:00<00:00, 108.32it/s]
100%|██████████| 40/40 [00:00<00:00, 233.33it/s]
 12%|█▏ 

[2m[36m(func pid=7788)[0m Epoch 00064: reducing learning rate of group 0 to 1.0555e-03.


 24%|██▍       | 33/138 [00:00<00:00, 163.49it/s]
 36%|███▌      | 50/138 [00:00<00:00, 148.78it/s]
 49%|████▊     | 67/138 [00:00<00:00, 155.24it/s]
 62%|██████▏   | 85/138 [00:00<00:00, 160.67it/s]
 74%|███████▍  | 102/138 [00:00<00:00, 160.64it/s]
100%|██████████| 40/40 [00:00<00:00, 359.79it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 151.54it/s]
 23%|██▎       | 32/138 [00:00<00:00, 147.48it/s]
 35%|███▍      | 48/138 [00:00<00:00, 151.76it/s]
 46%|████▋     | 64/138 [00:00<00:00, 149.18it/s]
 57%|█████▋    | 79/138 [00:00<00:00, 149.41it/s]
 68%|██████▊   | 94/138 [00:00<00:00, 143.97it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 145.25it/s]
 90%|████████▉ | 124/138 [00:00<00:00, 145.40it/s]
100%|██████████| 138/138 [00:00<00:00, 147.30it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 347.77it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 10%|█         | 14/138 [00:00<00:00, 134.43it/s]
 21%|██        | 29/138 [00:0

[2m[36m(func pid=7788)[0m Epoch 00077: reducing learning rate of group 0 to 5.2776e-04.


 25%|██▌       | 35/138 [00:00<00:00, 166.32it/s]
 38%|███▊      | 53/138 [00:00<00:00, 167.82it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 170.51it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 171.46it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 171.37it/s]
 91%|█████████ | 125/138 [00:00<00:00, 172.43it/s]
100%|██████████| 138/138 [00:00<00:00, 170.85it/s]
100%|██████████| 40/40 [00:00<00:00, 417.16it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 171.05it/s]
 26%|██▌       | 36/138 [00:00<00:00, 171.59it/s]
 39%|███▉      | 54/138 [00:00<00:00, 172.26it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 170.72it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 168.81it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 168.87it/s]
100%|██████████| 138/138 [00:00<00:00, 169.60it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 395.83it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 164.62it/s]
 25%|██▍       | 34/138 [00:

[2m[36m(func pid=7788)[0m Epoch 00087: reducing learning rate of group 0 to 2.6388e-04.


 12%|█▏        | 17/138 [00:00<00:00, 166.80it/s]
 25%|██▌       | 35/138 [00:00<00:00, 169.64it/s]
 38%|███▊      | 52/138 [00:00<00:00, 168.84it/s]
 50%|█████     | 69/138 [00:00<00:00, 166.81it/s]
 63%|██████▎   | 87/138 [00:00<00:00, 169.28it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 170.36it/s]
100%|██████████| 138/138 [00:00<00:00, 168.74it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 422.07it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 174.59it/s]
 26%|██▌       | 36/138 [00:00<00:00, 168.74it/s]
 38%|███▊      | 53/138 [00:00<00:00, 166.64it/s]
 51%|█████     | 70/138 [00:00<00:00, 161.06it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 165.33it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 133.65it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 144.68it/s]
100%|██████████| 138/138 [00:00<00:00, 153.50it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 420.40it/s]
  0%|          | 0/138 [00:00

[2m[36m(func pid=7788)[0m Epoch 00100: reducing learning rate of group 0 to 1.3194e-04.


 12%|█▏        | 16/138 [00:00<00:00, 148.44it/s]
 22%|██▏       | 31/138 [00:00<00:00, 148.85it/s]
 36%|███▌      | 49/138 [00:00<00:00, 158.81it/s]
 47%|████▋     | 65/138 [00:00<00:00, 153.56it/s]
 59%|█████▉    | 82/138 [00:00<00:00, 157.47it/s]
 71%|███████   | 98/138 [00:00<00:00, 151.50it/s]
 83%|████████▎ | 115/138 [00:00<00:00, 156.27it/s]
100%|██████████| 138/138 [00:00<00:00, 153.37it/s]
 22%|██▎       | 9/40 [00:00<00:00, 83.56it/s]
100%|██████████| 40/40 [00:00<00:00, 218.79it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 150.75it/s]
 23%|██▎       | 32/138 [00:00<00:00, 152.66it/s]
 36%|███▌      | 50/138 [00:00<00:00, 161.75it/s]
 49%|████▉     | 68/138 [00:00<00:00, 165.89it/s]
 62%|██████▏   | 86/138 [00:00<00:00, 168.95it/s]
 75%|███████▌  | 104/138 [00:00<00:00, 170.12it/s]
 88%|████████▊ | 122/138 [00:00<00:00, 170.21it/s]
100%|██████████| 138/138 [00:00<00:00, 167.25it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/

[2m[36m(func pid=7788)[0m Epoch 00110: reducing learning rate of group 0 to 6.5970e-05.


 13%|█▎        | 18/138 [00:00<00:00, 167.15it/s]
 25%|██▌       | 35/138 [00:00<00:00, 148.77it/s]
 49%|████▉     | 68/138 [00:00<00:00, 158.21it/s]
 61%|██████    | 84/138 [00:00<00:00, 151.40it/s]
 73%|███████▎  | 101/138 [00:00<00:00, 155.45it/s]
 85%|████████▍ | 117/138 [00:00<00:00, 146.40it/s]
100%|██████████| 138/138 [00:00<00:00, 149.07it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 397.86it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 10%|█         | 14/138 [00:00<00:00, 136.98it/s]
 22%|██▏       | 31/138 [00:00<00:00, 153.91it/s]
 34%|███▍      | 47/138 [00:00<00:00, 152.68it/s]
 46%|████▌     | 63/138 [00:00<00:00, 152.42it/s]
 58%|█████▊    | 80/138 [00:00<00:00, 156.64it/s]
 71%|███████   | 98/138 [00:00<00:00, 163.09it/s]
 84%|████████▍ | 116/138 [00:00<00:00, 167.52it/s]
100%|██████████| 138/138 [00:00<00:00, 162.99it/s]
100%|██████████| 40/40 [00:00<00:00, 411.44it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:

[2m[36m(func pid=7788)[0m Epoch 00116: reducing learning rate of group 0 to 3.2985e-05.


  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 165.17it/s]
 25%|██▍       | 34/138 [00:00<00:00, 157.14it/s]
 38%|███▊      | 52/138 [00:00<00:00, 164.90it/s]
 51%|█████     | 70/138 [00:00<00:00, 169.72it/s]
 64%|██████▍   | 88/138 [00:00<00:00, 170.41it/s]
 77%|███████▋  | 106/138 [00:00<00:00, 171.53it/s]
100%|██████████| 138/138 [00:00<00:00, 168.75it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 400.09it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 169.97it/s]
 25%|██▌       | 35/138 [00:00<00:00, 173.34it/s]
 38%|███▊      | 53/138 [00:00<00:00, 174.33it/s]
 51%|█████▏    | 71/138 [00:00<00:00, 174.62it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 173.98it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 174.98it/s]
 91%|█████████ | 125/138 [00:00<00:00, 175.37it/s]
100%|██████████| 138/138 [00:00<00:00, 174.27it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 4

[2m[36m(func pid=7788)[0m Epoch 00123: reducing learning rate of group 0 to 1.6492e-05.


 25%|██▍       | 34/138 [00:00<00:00, 157.62it/s]
 37%|███▋      | 51/138 [00:00<00:00, 160.75it/s]
 50%|█████     | 69/138 [00:00<00:00, 166.00it/s]
 75%|███████▌  | 104/138 [00:00<00:00, 169.13it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 172.56it/s]
100%|██████████| 138/138 [00:00<00:00, 169.12it/s]
100%|██████████| 40/40 [00:00<00:00, 435.86it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 13%|█▎        | 18/138 [00:00<00:00, 171.93it/s]
 26%|██▌       | 36/138 [00:00<00:00, 173.38it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 172.85it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 168.36it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 162.75it/s]
100%|██████████| 138/138 [00:00<00:00, 167.22it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 285.98it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 10%|█         | 14/138 [00:00<00:00, 137.88it/s]
 22%|██▏       | 30/138 [00:00<00:00, 147.37it/s]
 33%|███▎      | 45/138 [00:00<00:00, 147.80it/s]
 44%|████▍     | 61/138 [00:

[2m[36m(func pid=7788)[0m Epoch 00129: reducing learning rate of group 0 to 8.2462e-06.


  0%|          | 0/138 [00:00<?, ?it/s]
 26%|██▌       | 36/138 [00:00<00:00, 172.66it/s]
 39%|███▉      | 54/138 [00:00<00:00, 173.48it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 166.32it/s]
 64%|██████▍   | 89/138 [00:00<00:00, 163.47it/s]
 77%|███████▋  | 106/138 [00:00<00:00, 161.18it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 363.87it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 10%|█         | 14/138 [00:00<00:00, 139.54it/s]
 22%|██▏       | 31/138 [00:00<00:00, 152.36it/s]
 34%|███▍      | 47/138 [00:00<00:00, 150.61it/s]
 46%|████▌     | 63/138 [00:00<00:00, 150.52it/s]
 58%|█████▊    | 80/138 [00:00<00:00, 152.45it/s]
 81%|████████  | 112/138 [00:00<00:00, 148.25it/s]
 92%|█████████▏| 127/138 [00:00<00:00, 136.95it/s]
100%|██████████| 138/138 [00:00<00:00, 144.63it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 314.86it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 11%|█         | 15/138 [00:00<00:00, 146.99it/s]


[2m[36m(func pid=7788)[0m Epoch 00135: reducing learning rate of group 0 to 4.1231e-06.


 10%|█         | 14/138 [00:00<00:00, 137.07it/s]
 22%|██▏       | 30/138 [00:00<00:00, 144.69it/s]
 33%|███▎      | 46/138 [00:00<00:00, 146.46it/s]
 44%|████▍     | 61/138 [00:00<00:00, 139.09it/s]
 56%|█████▌    | 77/138 [00:00<00:00, 143.74it/s]
 67%|██████▋   | 92/138 [00:00<00:00, 141.02it/s]
 78%|███████▊  | 107/138 [00:00<00:00, 139.29it/s]
 91%|█████████ | 125/138 [00:00<00:00, 149.09it/s]
100%|██████████| 138/138 [00:00<00:00, 145.37it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 387.59it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
  9%|▊         | 12/138 [00:00<00:01, 115.50it/s]
 20%|█▉        | 27/138 [00:00<00:00, 130.33it/s]
 33%|███▎      | 45/138 [00:00<00:00, 150.03it/s]
 46%|████▌     | 63/138 [00:00<00:00, 160.25it/s]
 59%|█████▊    | 81/138 [00:00<00:00, 165.66it/s]
 72%|███████▏  | 99/138 [00:00<00:00, 168.32it/s]
 85%|████████▍ | 117/138 [00:00<00:00, 171.50it/s]
100%|██████████| 138/138 [00:00<00:00, 163.91it/s]
  0%|          | 

[2m[36m(func pid=7788)[0m Epoch 00141: reducing learning rate of group 0 to 2.0616e-06.


  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 17/138 [00:00<00:00, 165.13it/s]
 25%|██▌       | 35/138 [00:00<00:00, 172.83it/s]
 38%|███▊      | 53/138 [00:00<00:00, 174.15it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 175.99it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 177.83it/s]
 92%|█████████▏| 127/138 [00:00<00:00, 176.33it/s]
100%|██████████| 138/138 [00:00<00:00, 173.79it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 413.66it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 26%|██▌       | 36/138 [00:00<00:00, 175.91it/s]
 39%|███▉      | 54/138 [00:00<00:00, 177.66it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 177.47it/s]
 66%|██████▌   | 91/138 [00:00<00:00, 178.70it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 178.60it/s]
 92%|█████████▏| 127/138 [00:00<00:00, 176.04it/s]
100%|██████████| 138/138 [00:00<00:00, 176.02it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 416.04it/s]
  0%|          | 0/138 [00:00<?, ?it/s

[2m[36m(func pid=7788)[0m Epoch 00147: reducing learning rate of group 0 to 1.0308e-06.


 13%|█▎        | 18/138 [00:00<00:00, 174.03it/s]
 26%|██▌       | 36/138 [00:00<00:00, 174.82it/s]
 39%|███▉      | 54/138 [00:00<00:00, 173.61it/s]
 52%|█████▏    | 72/138 [00:00<00:00, 173.32it/s]
 65%|██████▌   | 90/138 [00:00<00:00, 174.45it/s]
 79%|███████▉  | 109/138 [00:00<00:00, 176.82it/s]
100%|██████████| 138/138 [00:00<00:00, 173.07it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 426.39it/s]
  0%|          | 0/138 [00:00<?, ?it/s]
 12%|█▏        | 16/138 [00:00<00:00, 156.83it/s]
 24%|██▍       | 33/138 [00:00<00:00, 158.88it/s]
 36%|███▌      | 50/138 [00:00<00:00, 161.59it/s]
 50%|█████     | 69/138 [00:00<00:00, 168.72it/s]
 63%|██████▎   | 87/138 [00:00<00:00, 172.01it/s]
 76%|███████▌  | 105/138 [00:00<00:00, 174.59it/s]
 89%|████████▉ | 123/138 [00:00<00:00, 175.32it/s]
100%|██████████| 138/138 [00:00<00:00, 171.66it/s]
  0%|          | 0/40 [00:00<?, ?it/s]
100%|██████████| 40/40 [00:00<00:00, 425.71it/s]
  0%|          | 0/138 [00:00

[2m[36m(func pid=22192)[0m Epoch 00014: reducing learning rate of group 0 to 1.2408e-02.


  5%|▌         | 15/276 [00:00<00:01, 148.83it/s]
 11%|█         | 31/276 [00:00<00:01, 150.98it/s]
 17%|█▋        | 47/276 [00:00<00:01, 152.59it/s]
 23%|██▎       | 63/276 [00:00<00:01, 154.81it/s]
 29%|██▊       | 79/276 [00:00<00:01, 155.67it/s]
 34%|███▍      | 95/276 [00:00<00:01, 152.06it/s]
 40%|████      | 111/276 [00:00<00:01, 147.56it/s]
 46%|████▌     | 127/276 [00:00<00:00, 149.64it/s]
 52%|█████▏    | 144/276 [00:00<00:00, 153.37it/s]
 58%|█████▊    | 161/276 [00:01<00:00, 155.53it/s]
 64%|██████▍   | 178/276 [00:01<00:00, 158.50it/s]
 77%|███████▋  | 212/276 [00:01<00:00, 159.10it/s]
 83%|████████▎ | 229/276 [00:01<00:00, 160.30it/s]
 89%|████████▉ | 246/276 [00:01<00:00, 160.81it/s]
  0%|          | 0/79 [00:00<?, ?it/s]
100%|██████████| 79/79 [00:00<00:00, 585.76it/s]
  6%|▌         | 16/276 [00:00<00:01, 157.54it/s]
 12%|█▏        | 32/276 [00:00<00:01, 155.86it/s]
 17%|█▋        | 48/276 [00:00<00:01, 143.09it/s]
 23%|██▎       | 63/276 [00:00<00:01, 136.89it/s]
 28%

[2m[36m(func pid=22192)[0m Epoch 00038: reducing learning rate of group 0 to 6.2040e-03.


 12%|█▏        | 34/276 [00:00<00:01, 166.82it/s]
 18%|█▊        | 51/276 [00:00<00:01, 152.98it/s]
 30%|███       | 83/276 [00:00<00:01, 148.23it/s]
 36%|███▌      | 98/276 [00:00<00:01, 145.63it/s]
 41%|████      | 113/276 [00:00<00:01, 146.93it/s]
 47%|████▋     | 129/276 [00:00<00:00, 149.65it/s]
 53%|█████▎    | 146/276 [00:00<00:00, 154.93it/s]
 59%|█████▉    | 163/276 [00:01<00:00, 157.98it/s]
 65%|██████▍   | 179/276 [00:01<00:00, 157.21it/s]
 71%|███████   | 196/276 [00:01<00:00, 160.06it/s]
 77%|███████▋  | 213/276 [00:01<00:00, 161.46it/s]
 83%|████████▎ | 230/276 [00:01<00:00, 152.99it/s]
 89%|████████▉ | 246/276 [00:01<00:00, 150.12it/s]
 73%|███████▎  | 58/79 [00:00<00:00, 578.25it/s]
100%|██████████| 79/79 [00:00<00:00, 576.70it/s]
  0%|          | 0/276 [00:00<?, ?it/s]
  6%|▌         | 16/276 [00:00<00:01, 152.53it/s]
 12%|█▏        | 32/276 [00:00<00:01, 153.17it/s]
 17%|█▋        | 48/276 [00:00<00:01, 131.74it/s]
 22%|██▏       | 62/276 [00:00<00:01, 131.36it/s]
 28