In [11]:
import pandas as pd
import numpy as np
import os
import shutil
from tqdm import tqdm
import argparse
import tensorflow as tf
from tqdm import tqdm
from PIL import Image
import io
import json
import time
import sys
from shufflenet import get_shufflenet

In [2]:
# The validation annotations are one tab-separated file without a header:
# column 0 holds the image file name, column 1 the class of that image,
# columns 2-5 hold bounding box info that is not used in this notebook.
data_dir = 'tiny-imagenet-200'
annotations_file = os.path.join(data_dir, 'val', 'val_annotations.txt')
annotations_raw = pd.read_csv(annotations_file, sep='\t', header=None)
val_data = annotations_raw.drop([2, 3, 4, 5], axis=1)
val_data.columns = ['img_name', 'img_class']
unique_classes = val_data['img_class'].unique()

In [3]:
# create new folders to move the data into;
# exist_ok=True lets this cell be re-run without a FileExistsError
validation_dir = os.path.join(data_dir, 'validation')
os.makedirs(validation_dir, exist_ok=True)
for name in unique_classes:
    os.makedirs(os.path.join(validation_dir, name), exist_ok=True)

In [4]:
# Copy every validation image from the flat val/images folder
# into the folder of the class it is annotated with.
val_images_dir = os.path.join(data_dir, 'val', 'images')
for class_name in tqdm(unique_classes):
    # rows of the annotation table that belong to this class
    belongs_to_class = val_data.img_class == class_name
    for file_name in val_data.loc[belongs_to_class, 'img_name'].values:
        source_path = os.path.join(val_images_dir, file_name)
        target_path = os.path.join(validation_dir, class_name, file_name)
        shutil.copyfile(source_path, target_path)

100%|██████████| 200/200 [00:01<00:00, 170.71it/s]


In [5]:
# create new folders to move data into;
# exist_ok=True lets this cell be re-run without a FileExistsError
training_dir = os.path.join(data_dir, 'training')
os.makedirs(training_dir, exist_ok=True)
for name in unique_classes:
    os.makedirs(os.path.join(training_dir, name), exist_ok=True)

In [6]:
# Copy train/<class>/images/* into training/<class>/ for every class.
for class_name in tqdm(unique_classes):
    source_dir = os.path.join(data_dir, 'train', class_name, 'images')
    target_dir = os.path.join(training_dir, class_name)
    for file_name in os.listdir(source_dir):
        shutil.copyfile(
            os.path.join(source_dir, file_name),
            os.path.join(target_dir, file_name)
        )

100%|██████████| 200/200 [00:09<00:00, 21.90it/s]


In [7]:
def main():
    """Save the class encoder and convert both image folders to tfrecords.

    Uses the module-level `train_dir`, `val_dir` and `save_dir`.
    The encoder (a dict, folder_name -> integer) is built from `train_dir`
    only and is reused for the validation folder.
    """
    encoder_path = os.path.join(save_dir, 'class_encoder.npy')
    train_path = os.path.join(save_dir, 'train.tfrecords')
    val_path = os.path.join(save_dir, 'val.tfrecords')

    encoder = create_encoder(train_dir)
    np.save(encoder_path, encoder)

    convert(train_dir, encoder, train_path)
    convert(val_dir, encoder, val_path)

    print('\nCreated two tfrecords files:')
    for created_path in (train_path, val_path):
        print(created_path)

In [8]:
def _bytes_feature(value):
    """Wrap one bytes value into a `tf.train.Feature`."""
    bytes_list = tf.train.BytesList(value=[value])
    return tf.train.Feature(bytes_list=bytes_list)

def _int64_feature(value):
    """Wrap one integer value into a `tf.train.Feature`."""
    int64_list = tf.train.Int64List(value=[value])
    return tf.train.Feature(int64_list=int64_list)


# Storing the raw array bytes instead (`return array.tostring()`) is
# also possible, but it makes tfrecords files a lot larger and
# the input pipeline has to be changed accordingly.
def to_bytes(array):
    """Encode an image array as JPEG and return the encoded bytes."""
    with io.BytesIO() as buffer:
        Image.fromarray(array).save(buffer, format='jpeg')
        return buffer.getvalue()

def convert(folder, encoder, tfrecords_filename):
    """Convert a folder with directories of images to tfrecords format.

    Each image is decoded, forced to three RGB channels, encoded again
    with `to_bytes` and written together with its integer class as one
    `tf.train.Example` with the features 'image' and 'target'.

    Arguments:
        folder: A path to a folder where directories with images are.
        encoder: A dict, folder_name -> integer.
        tfrecords_filename: A path where to save tfrecords file.
    """
    images_metadata = collect_metadata(folder, encoder)

    # the context manager closes the writer even when an image fails to load
    with tf.python_io.TFRecordWriter(tfrecords_filename) as writer:

        # iterrows() has no length, so give tqdm the total explicitly
        rows = tqdm(images_metadata.iterrows(), total=len(images_metadata))
        for _, row in rows:

            file_path = os.path.join(folder, row.img_path)

            # read an image and convert it to an array;
            # some images are grayscale (or use yet another mode),
            # convert('RGB') gives three channels for all of them
            with Image.open(file_path) as image:
                array = np.asarray(image.convert('RGB'), dtype='uint8')

            # get class of the image
            target = int(row.class_number)

            feature = {
                'image': _bytes_feature(to_bytes(array)),
                'target': _int64_feature(target),
            }

            example = tf.train.Example(features=tf.train.Features(feature=feature))
            writer.write(example.SerializeToString())

def create_encoder(folder):
    """Encode directories in the folder with integer values.
    Values are in the range 0..(n_directories - 1) and are assigned in
    sorted name order, so the encoding does not depend on the order
    in which the file system lists the entries.
    Entries of the folder that are not directories are ignored.
    Arguments:
        folder: A path to a folder where directories with images are.
            Each directory - separate class.
    Returns:
        A dict, folder_name -> integer.
    """
    classes = sorted(
        name for name in os.listdir(folder)
        if os.path.isdir(os.path.join(folder, name))
    )
    encoder = {n: i for i, n in enumerate(classes)}
    return encoder


def collect_metadata(folder, encoder, random_state=None):
    """Collect paths to images. Collect their classes.
    All paths must be with respect to 'folder'.
    Arguments:
        folder: A path to a folder where directories with images are.
            Each directory - separate class.
        encoder: A dict, folder_name -> integer.
        random_state: Optional seed passed to `DataFrame.sample`
            to make the shuffle reproducible. With the default (None)
            the order differs from call to call.
    Returns:
        A pandas dataframe with the columns
        'class_name', 'img_path' and 'class_number', rows are shuffled.
    Raises:
        KeyError: if a directory name is not in the encoder.
    """

    # the first item of os.walk is 'folder' itself, skip it
    subdirs = list(os.walk(folder))[1:]
    metadata = []

    for dir_path, _, files in subdirs:
        # basename works with any path separator
        dir_name = os.path.basename(dir_path)
        for file_name in files:
            image_metadata = [dir_name, os.path.join(dir_name, file_name)]
            metadata.append(image_metadata)

    # os.walk order depends on the file system,
    # sorting makes a seeded shuffle give the same result everywhere
    metadata.sort()

    # passing the columns here also works when no images were found
    M = pd.DataFrame(metadata, columns=['class_name', 'img_path'])

    # encode folder names by integers
    M['class_number'] = M.class_name.apply(lambda x: encoder[x])

    # nothing to shuffle
    if M.empty:
        return M

    # shuffle the dataframe
    M = M.sample(frac=1, random_state=random_state).reset_index(drop=True)
    return M

In [9]:
# Folders read by main(): the per-class image folders and
# the folder that receives the encoder and the tfrecords files.
save_dir = 'tiny-imagenet-200'
train_dir, val_dir = (
    'tiny-imagenet-200/training',
    'tiny-imagenet-200/validation',
)

In [10]:
# Save the class encoder and write train.tfrecords / val.tfrecords into save_dir.
main()

100000it [02:08, 778.20it/s]
10000it [00:12, 809.85it/s]


Created two tfrecords files:
tiny-imagenet-200/train.tfrecords
tiny-imagenet-200/val.tfrecords





In [18]:
# Training settings as plain module-level variables.
# NOTE(review): `FLAGS = Foo()` is built from the defaults of `Foo`,
# so train() does not read the variables of this cell unless they are
# passed to `Foo(...)`. `num_epochs` here (35) differs from the default
# of `Foo` (50) - confirm which one is intended.
run = 0
# 'store_true' is the name of an argparse action, not a value;
# it is truthy, so True keeps the same meaning as a real boolean
reset = True
train_tfrecords = 'tiny-imagenet-200/train.tfrecords'
val_tfrecords = 'tiny-imagenet-200/val.tfrecords'
num_epochs = 35
batch_size = 200
steps_per_epoch = 500
validation_steps = 50
lr_patience = 4
lr_threshold = 0.01
patience = 10
threshold = 0.01
initial_lr = 1e-1
weight_decay = 5e-3
groups = 3
dropout = 0.5
complexity_scale_factor = 0.75

In [19]:
class Foo:
    """Plain container of training settings.

    Every constructor argument is stored unchanged as an attribute with
    the same name. Attributes are assigned in the order of the arguments,
    which is also the key order of `vars(instance)`.
    """

    def __init__(
            self,
            run=0,
            reset=True,
            train_tfrecords='tiny-imagenet-200/train.tfrecords',
            val_tfrecords='tiny-imagenet-200/val.tfrecords',
            num_epochs=50,
            batch_size=200,
            steps_per_epoch=500,
            validation_steps=50,
            lr_patience=4,
            lr_threshold=0.01,
            patience=10,
            threshold=0.01,
            initial_lr=1e-1,
            weight_decay=5e-3,
            groups=3,
            dropout=0.5,
            complexity_scale_factor=0.75):

        # run folder and data sources
        self.run = run
        self.reset = reset
        self.train_tfrecords = train_tfrecords
        self.val_tfrecords = val_tfrecords

        # length of training
        self.num_epochs = num_epochs
        self.batch_size = batch_size
        self.steps_per_epoch = steps_per_epoch
        self.validation_steps = validation_steps

        # learning rate reduction and early stopping
        self.lr_patience = lr_patience
        self.lr_threshold = lr_threshold
        self.patience = patience
        self.threshold = threshold

        # values passed to get_shufflenet
        self.initial_lr = initial_lr
        self.weight_decay = weight_decay
        self.groups = groups
        self.dropout = dropout
        self.complexity_scale_factor = complexity_scale_factor


In [20]:
# Settings object read by train(); it holds the defaults of Foo.
# NOTE(review): the module-level variables (run, reset, num_epochs, ...)
# assigned in an earlier cell are not passed in here - confirm this is intended.
FLAGS = Foo()

In [21]:
def train():
    """Train the ShuffleNet graph using the settings in the global `FLAGS`.

    Steps, in order:
      * create `logs/run<N>` and `saved/run<N>` (both are removed first
        when `FLAGS.reset` is set);
      * build the graph with `get_shufflenet` and open a session;
      * restore the saved model when `training_info.txt` already exists
        and `FLAGS.reset` is false, otherwise initialize the variables;
      * run up to `FLAGS.num_epochs` epochs of `FLAGS.steps_per_epoch`
        optimization steps, evaluate on the validation data after every
        epoch, then check early stopping and learning rate reduction;
      * write the collected metrics and the config, save the model.

    KeyboardInterrupt and SystemExit raised inside the epoch loop stop
    the training, but the logs and the model are still written.
    The summary writer and the session are closed on every exit path.

    Raises:
        SystemExit: if the previously saved model can't be restored.
    """

    # folders for logging and saving
    dir_to_log = os.path.join('logs', 'run' + str(FLAGS.run))
    dir_to_save = os.path.join('saved', 'run' + str(FLAGS.run))

    print('\nTraining logs and summaries will be in', dir_to_log)
    print('Saved model will be in', dir_to_save, '\n')

    # create these folders
    if FLAGS.reset and os.path.exists(dir_to_log):
        shutil.rmtree(dir_to_log)
    if FLAGS.reset and os.path.exists(dir_to_save):
        shutil.rmtree(dir_to_save)
    if not os.path.exists(dir_to_log):
        os.makedirs(dir_to_log)
    if not os.path.exists(dir_to_save):
        os.makedirs(dir_to_save)

    # files with losses and config
    training_info_file = os.path.join(dir_to_log, 'training_info.txt')
    model_config_file = os.path.join(dir_to_log, 'model_config.txt')
    print('Training/validation evaluations will be in', training_info_file)
    print('Model config will be in', model_config_file, '\n')

    # create the graph and start a session
    graph, ops = get_shufflenet(
        FLAGS.initial_lr, FLAGS.weight_decay,
        FLAGS.groups, FLAGS.dropout,
        FLAGS.complexity_scale_factor
    )
    sess = tf.Session(graph=graph)
    writer = tf.summary.FileWriter(dir_to_log, sess.graph)
    print('\nCreated the graph and started a session!')

    # from here on the writer and the session must be released,
    # whatever happens
    try:
        # check if to continue training or start from scratch
        warm = os.path.exists(training_info_file)  # warm start
        if warm and not FLAGS.reset:
            print('Restoring previously saved model and continuing training.\n')
            # the file has a header line and one line per finished epoch,
            # so the number of lines is the number of the next epoch
            with open(training_info_file) as info_file:
                initial_epoch = sum(1 for _ in info_file)
            try:
                ops['saver'].restore(sess, os.path.join(dir_to_save, 'model'))
            except Exception:
                # not a bare except: ctrl-c must not be reported
                # as a failed restore
                print('\nCan\'t restore the saved model, '
                      'maybe architectures don\'t match.')
                sys.exit()
        else:
            print('Training model from scratch.\n')
            initial_epoch = 1
            sess.run(ops['init_variables'])

        # initialize data sources
        data_dict = {
            'input_pipeline/train_file:0': FLAGS.train_tfrecords,
            'input_pipeline/val_file:0': FLAGS.val_tfrecords,
            'input_pipeline/batch_size:0': FLAGS.batch_size
        }
        sess.run(ops['init_data'], data_dict)

        losses = []  # training info will be collected here
        training_epochs = range(
            initial_epoch,
            initial_epoch + FLAGS.num_epochs
        )

        # begin training,
        # but you can interrupt training by ctrl-c,
        # your model will be saved
        try:
            for epoch in training_epochs:

                start_time = time.time()
                running_loss, running_accuracy = 0.0, 0.0
                sess.run(ops['train_init'])

                # at zeroth step also collect metadata and summaries
                run_options = tf.RunOptions(
                    trace_level=tf.RunOptions.FULL_TRACE
                )
                run_metadata = tf.RunMetadata()

                # do epoch's zeroth step
                _, batch_loss, batch_accuracy, summary, grad_summary = sess.run([
                    ops['optimize'], ops['log_loss'], ops['accuracy'],
                    ops['summaries'], ops['grad_summaries']
                ], options=run_options, run_metadata=run_metadata)
                running_loss += batch_loss
                running_accuracy += batch_accuracy

                print('epoch', epoch)
                # the zeroth step is already done, so the bar starts at 1
                training_steps = tqdm(
                    range(1, FLAGS.steps_per_epoch),
                    initial=1, total=FLAGS.steps_per_epoch
                )

                # main training loop
                for step in training_steps:

                    _, batch_loss, batch_accuracy = sess.run([
                        ops['optimize'], ops['log_loss'], ops['accuracy']
                    ])
                    running_loss += batch_loss
                    running_accuracy += batch_accuracy

                # evaluate on the validation set
                val_loss, val_accuracy = _evaluate(
                    sess, ops, FLAGS.validation_steps
                )
                train_loss = running_loss/FLAGS.steps_per_epoch
                train_accuracy = running_accuracy/FLAGS.steps_per_epoch

                # collect all losses and accuracies
                losses += [(
                    epoch, train_loss, val_loss,
                    train_accuracy, val_accuracy, time.time() - start_time
                )]
                writer.add_run_metadata(run_metadata, str(epoch))
                writer.add_summary(summary, epoch)
                writer.add_summary(grad_summary, epoch)
                print('loss: {0:.3f}, val_loss: {1:.3f}, '
                      'acc: {2:.3f}, val_acc: {3:.3f}, time: {4:.3f}\n'.format(*losses[-1][1:]))

                # consider a possibility of early stopping
                if _is_early_stopping(losses, FLAGS.patience, FLAGS.threshold):
                    print('Early stopping!')
                    break

                # consider a possibility of reducing learning rate by some factor
                _reduce_lr_on_plateau(
                    sess, ops, losses,
                    FLAGS.lr_patience, FLAGS.lr_threshold
                )
        except (KeyboardInterrupt, SystemExit):
            print(' Interruption detected, exiting the program...')

        print('Writing logs and saving the trained model.')
        _write_training_info(
            FLAGS, losses, warm,
            training_info_file, model_config_file
        )
        ops['saver'].save(sess, os.path.join(dir_to_save, 'model'))
    finally:
        # close the writer first so that pending summaries reach the disk,
        # and close the session even if that fails
        try:
            writer.close()
        finally:
            sess.close()


def _evaluate(sess, ops, validation_steps):

    val_loss, val_accuracy = 0.0, 0.0
    sess.run(ops['val_init'])

    for i in range(validation_steps):
        batch_loss, batch_accuracy = sess.run(
            [ops['log_loss'], ops['accuracy']],
            {'control/is_training:0': False}
        )
        val_loss += batch_loss
        val_accuracy += batch_accuracy

    val_loss /= validation_steps
    val_accuracy /= validation_steps
    return val_loss, val_accuracy


# it decides if training must stop
def _is_early_stopping(losses, patience=10, threshold=0.01):

    # get validation set accuracies
    accuracies = [x[4] for x in losses]

    if len(losses) > (patience + 4):
        # running average
        average = (accuracies[-(patience + 4)] +
                   accuracies[-(patience + 3)] +
                   accuracies[-(patience + 2)] +
                   accuracies[-(patience + 1)] +
                   accuracies[-patience])/5.0
        return accuracies[-1] < average + threshold
    else:
        return False


def _reduce_lr_on_plateau(
        sess, ops, losses,
        patience=10, threshold=0.01):

    # get validation set accuracies
    accuracies = [x[4] for x in losses]

    if len(losses) > (patience + 4):
        # running average
        average = (accuracies[-(patience + 4)] +
                   accuracies[-(patience + 3)] +
                   accuracies[-(patience + 2)] +
                   accuracies[-(patience + 1)] +
                   accuracies[-patience])/5.0
        if accuracies[-1] < (average + threshold):
            sess.run(ops['drop_learning_rate'])
            print('Learning rate is dropped!\n')


def _write_training_info(
        FLAGS, losses, warm,
        training_info_file, model_config_file):

    mode = 'a' if warm else 'w'
    with open(training_info_file, mode) as f:

        # if file is new then add columns
        if not warm:
            columns = ('epoch,train_loss,val_loss,'
                       'train_accuracy,val_accuracy,time\n')
            f.write(columns)

        for i in losses:
            values = ('{0},{1:.3f},{2:.3f},'
                      '{3:.3f},{4:.3f},{5:.3f}\n').format(*i)
            f.write(values)

    with open(model_config_file, mode) as f:
        FLAGS_dict = vars(FLAGS)
        # len(losses) equals to the number of passed full epochs
        FLAGS_dict['num_epochs'] = len(losses)
        json.dump(FLAGS_dict, f)
        f.write('\n')

In [22]:
# Keep the current TensorFlow logging verbosity in old_v,
# then set the verbosity to ERROR.
old_v = tf.logging.get_verbosity()
tf.logging.set_verbosity(tf.logging.ERROR)

In [None]:
# Run the training with the settings stored in FLAGS.
train()


Training logs and summaries will be in logs/run0
Saved model will be in saved/run0 

Training/validation evaluations will be in logs/run0/training_info.txt
Model config will be in logs/run0/model_config.txt 


Created the graph and started a session!
Training model from scratch.




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 1



  0%|          | 2/500 [00:03<31:03,  3.74s/it][A
  1%|          | 3/500 [00:04<22:30,  2.72s/it][A
  1%|          | 4/500 [00:04<16:31,  2.00s/it][A
  1%|          | 5/500 [00:04<12:21,  1.50s/it][A
  1%|          | 6/500 [00:05<09:26,  1.15s/it][A
  1%|▏         | 7/500 [00:05<07:24,  1.11it/s][A
  2%|▏         | 8/500 [00:05<05:58,  1.37it/s][A
  2%|▏         | 9/500 [00:06<04:59,  1.64it/s][A
  2%|▏         | 10/500 [00:06<04:19,  1.89it/s][A
  2%|▏         | 11/500 [00:06<03:50,  2.13it/s][A
  2%|▏         | 12/500 [00:07<03:29,  2.33it/s][A
  3%|▎         | 13/500 [00:07<03:15,  2.50it/s][A
  3%|▎         | 14/500 [00:07<03:04,  2.63it/s][A
  3%|▎         | 15/500 [00:08<02:57,  2.73it/s][A
  3%|▎         | 16/500 [00:08<02:52,  2.81it/s][A
  3%|▎         | 17/500 [00:08<02:48,  2.87it/s][A
  4%|▎         | 18/500 [00:09<02:45,  2.91it/s][A
  4%|▍         | 19/500 [00:09<02:42,  2.95it/s][A
  4%|▍         | 20/500 [00:09<02:42,  2.96it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:46<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:46<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:46<01:02,  2.99it/s][A
 63%|██████▎   | 315/500 [01:47<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:47<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:47<01:00,  3.00it/s][A
 64%|██████▎   | 318/500 [01:48<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:48<01:00,  3.02it/s][A
 64%|██████▍   | 320/500 [01:48<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:49<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:49<00:58,  3.04it/s][A
 65%|██████▍   | 323/500 [01:49<00:58,  3.04it/s][A
 65%|██████▍   | 324/500 [01:50<00:57,  3.04it/s][A
 65%|██████▌   | 325/500 [01:50<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:50<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:51<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:51<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:51<00:57,  3.00it/s][A
 66%|██████▌   | 330/500 [01:52<00:56,  3.00it

loss: 4.847, val_loss: 4.492, acc: 0.056, val_acc: 0.078, time: 184.688




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 2



  0%|          | 2/500 [00:00<02:48,  2.96it/s][A
  1%|          | 3/500 [00:00<02:46,  2.98it/s][A
  1%|          | 4/500 [00:00<02:45,  3.01it/s][A
  1%|          | 5/500 [00:01<02:44,  3.01it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.00it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 4.193, val_loss: 4.009, acc: 0.103, val_acc: 0.136, time: 176.798




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 3



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.05it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:44,  3.00it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.05it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.04it

loss: 4.053, val_loss: 3.879, acc: 0.122, val_acc: 0.148, time: 176.911




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 4



  0%|          | 2/500 [00:00<02:43,  3.04it/s][A
  1%|          | 3/500 [00:00<02:44,  3.03it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:44,  3.01it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:44,  3.00it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.00it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 3.987, val_loss: 3.741, acc: 0.129, val_acc: 0.175, time: 177.025




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 5



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:43,  3.03it/s][A
  1%|          | 4/500 [00:00<02:44,  3.01it/s][A
  1%|          | 5/500 [00:01<02:44,  3.01it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  2.99it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  2.98it/s][A
 65%|██████▌   | 326/500 [01:47<00:58,  2.98it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  2.99it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 3.947, val_loss: 3.777, acc: 0.136, val_acc: 0.164, time: 177.067




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 6



  0%|          | 2/500 [00:00<02:42,  3.07it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.06it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.00it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.00it

loss: 3.923, val_loss: 3.734, acc: 0.140, val_acc: 0.161, time: 177.127




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 7



  0%|          | 2/500 [00:00<02:40,  3.10it/s][A
  1%|          | 3/500 [00:00<02:41,  3.07it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:44,  3.00it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.00it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.00it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  2.99it

loss: 3.901, val_loss: 3.708, acc: 0.143, val_acc: 0.176, time: 176.962




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 8



  0%|          | 2/500 [00:00<02:40,  3.10it/s][A
  1%|          | 3/500 [00:00<02:41,  3.08it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.05it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.05it/s][A
  4%|▎         | 18/500 [00:05<02:37,  3.05it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.00it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 3.890, val_loss: 3.731, acc: 0.147, val_acc: 0.169, time: 177.040




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 9



  0%|          | 2/500 [00:00<02:42,  3.07it/s][A
  1%|          | 3/500 [00:00<02:43,  3.04it/s][A
  1%|          | 4/500 [00:00<02:43,  3.03it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:46<00:58,  3.05it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.06it/s][A
 65%|██████▍   | 323/500 [01:46<00:57,  3.05it/s][A
 65%|██████▍   | 324/500 [01:47<00:57,  3.07it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.06it/s][A
 65%|██████▌   | 326/500 [01:47<00:56,  3.07it/s][A
 65%|██████▌   | 327/500 [01:48<00:56,  3.06it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.06it/s][A
 66%|██████▌   | 329/500 [01:48<00:55,  3.06it/s][A
 66%|██████▌   | 330/500 [01:49<00:55,  3.06it

loss: 3.877, val_loss: 3.692, acc: 0.148, val_acc: 0.171, time: 177.124




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 10



  0%|          | 2/500 [00:00<02:41,  3.08it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  2.98it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 3.871, val_loss: 3.626, acc: 0.150, val_acc: 0.190, time: 176.953




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 11



  0%|          | 2/500 [00:00<02:41,  3.08it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.06it/s][A
  1%|          | 6/500 [00:01<02:42,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:40,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.03it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.03it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 3.861, val_loss: 3.707, acc: 0.151, val_acc: 0.172, time: 177.088

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 12



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:43,  3.04it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:40,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  2.99it/s][A
 63%|██████▎   | 314/500 [01:43<01:02,  2.97it/s][A
 63%|██████▎   | 315/500 [01:43<01:02,  2.98it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  2.99it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.00it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 3.295, val_loss: 2.943, acc: 0.242, val_acc: 0.316, time: 177.208




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 13



  0%|          | 2/500 [00:00<02:40,  3.10it/s][A
  1%|          | 3/500 [00:00<02:40,  3.09it/s][A
  1%|          | 4/500 [00:00<02:40,  3.09it/s][A
  1%|          | 5/500 [00:01<02:41,  3.07it/s][A
  1%|          | 6/500 [00:01<02:41,  3.06it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.05it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 16/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.05it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.05it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.06it/s][A
 63%|██████▎   | 317/500 [01:44<00:59,  3.07it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.07it/s][A
 64%|██████▍   | 319/500 [01:45<00:58,  3.07it/s][A
 64%|██████▍   | 320/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.05it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.06it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.03it

loss: 3.078, val_loss: 2.823, acc: 0.283, val_acc: 0.338, time: 176.975




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 14



  0%|          | 2/500 [00:00<02:44,  3.04it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:44,  3.00it/s][A
  2%|▏         | 8/500 [00:02<02:44,  3.00it/s][A
  2%|▏         | 9/500 [00:02<02:43,  2.99it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:43,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:05<02:42,  2.97it/s][A
  3%|▎         | 17/500 [00:05<02:41,  2.99it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.00it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.00it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.00it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 3.002, val_loss: 2.783, acc: 0.299, val_acc: 0.347, time: 176.988




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 15



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:45,  3.01it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:44,  3.01it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  2.99it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  3.00it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 2.943, val_loss: 2.740, acc: 0.312, val_acc: 0.355, time: 177.116




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 16



  0%|          | 2/500 [00:00<02:42,  3.07it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  3.00it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.03it

loss: 2.898, val_loss: 2.720, acc: 0.321, val_acc: 0.359, time: 177.182




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 17



  0%|          | 2/500 [00:00<02:41,  3.08it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:41,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 14/500 [00:04<02:42,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.05it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.05it/s][A
 64%|██████▎   | 318/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:58,  2.99it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 2.856, val_loss: 2.676, acc: 0.327, val_acc: 0.363, time: 177.110




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 18



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.05it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.04it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.04it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.03it

loss: 2.814, val_loss: 2.611, acc: 0.339, val_acc: 0.385, time: 176.913




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 19



  0%|          | 2/500 [00:00<02:45,  3.02it/s][A
  1%|          | 3/500 [00:00<02:44,  3.03it/s][A
  1%|          | 4/500 [00:00<02:43,  3.03it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:40,  2.99it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.03it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.00it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.00it

loss: 2.780, val_loss: 2.609, acc: 0.341, val_acc: 0.379, time: 176.871




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 20



  0%|          | 2/500 [00:00<02:38,  3.15it/s][A
  1%|          | 3/500 [00:00<02:40,  3.10it/s][A
  1%|          | 4/500 [00:00<02:41,  3.08it/s][A
  1%|          | 5/500 [00:01<02:41,  3.06it/s][A
  1%|          | 6/500 [00:01<02:41,  3.06it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.05it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.00it

loss: 2.748, val_loss: 2.610, acc: 0.349, val_acc: 0.383, time: 176.995




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 21



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.05it/s][A
  1%|          | 4/500 [00:00<02:42,  3.04it/s][A
  1%|          | 5/500 [00:01<02:43,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.05it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.03it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 2.729, val_loss: 2.555, acc: 0.354, val_acc: 0.400, time: 176.808




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 22



  0%|          | 2/500 [00:00<02:42,  3.07it/s][A
  1%|          | 3/500 [00:00<02:42,  3.07it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:49<00:55,  3.04it

loss: 2.698, val_loss: 2.554, acc: 0.359, val_acc: 0.395, time: 177.050




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 23



  0%|          | 2/500 [00:00<02:40,  3.10it/s][A
  1%|          | 3/500 [00:00<02:40,  3.09it/s][A
  1%|          | 4/500 [00:00<02:42,  3.04it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  2.99it/s][A
  3%|▎         | 17/500 [00:05<02:41,  2.99it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.00it

loss: 2.682, val_loss: 2.541, acc: 0.362, val_acc: 0.399, time: 176.937




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 24



  0%|          | 2/500 [00:00<02:43,  3.04it/s][A
  1%|          | 3/500 [00:00<02:44,  3.03it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:43,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.05it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 2.664, val_loss: 2.504, acc: 0.368, val_acc: 0.405, time: 176.962




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 25



  0%|          | 2/500 [00:00<02:45,  3.00it/s][A
  1%|          | 3/500 [00:00<02:45,  3.00it/s][A
  1%|          | 4/500 [00:01<02:45,  2.99it/s][A
  1%|          | 5/500 [00:01<02:45,  3.00it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:43,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.04it

loss: 2.649, val_loss: 2.515, acc: 0.369, val_acc: 0.408, time: 177.036




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 26



  0%|          | 2/500 [00:00<02:44,  3.02it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.05it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 16/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.05it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  2.98it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  2.99it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 2.635, val_loss: 2.486, acc: 0.373, val_acc: 0.405, time: 176.726




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 27



  0%|          | 2/500 [00:00<02:45,  3.02it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.02it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.02it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.01it

loss: 2.621, val_loss: 2.483, acc: 0.376, val_acc: 0.409, time: 177.117




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 28



  0%|          | 2/500 [00:00<02:43,  3.05it/s][A
  1%|          | 3/500 [00:00<02:43,  3.05it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.00it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.05it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.06it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.06it/s][A
 64%|██████▍   | 320/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.06it/s][A
 65%|██████▍   | 323/500 [01:46<00:57,  3.06it/s][A
 65%|██████▍   | 324/500 [01:46<00:57,  3.06it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.06it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.05it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.06it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.06it/s][A
 66%|██████▌   | 329/500 [01:48<00:55,  3.06it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 2.607, val_loss: 2.506, acc: 0.378, val_acc: 0.398, time: 176.909

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 29



  0%|          | 2/500 [00:00<02:43,  3.05it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.04it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.03it

loss: 2.289, val_loss: 2.193, acc: 0.450, val_acc: 0.477, time: 177.282




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 30



  0%|          | 2/500 [00:00<02:46,  2.99it/s][A
  1%|          | 3/500 [00:00<02:45,  3.01it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:41,  3.06it/s][A
  1%|          | 6/500 [00:01<02:41,  3.06it/s][A
  1%|▏         | 7/500 [00:01<02:40,  3.06it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:39,  3.07it/s][A
  2%|▏         | 10/500 [00:02<02:39,  3.06it/s][A
  2%|▏         | 11/500 [00:03<02:39,  3.06it/s][A
  2%|▏         | 12/500 [00:03<02:39,  3.06it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.06it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.05it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.06it/s][A
  3%|▎         | 16/500 [00:04<02:38,  3.06it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.05it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.03it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:57,  3.04it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.05it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.04it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.04it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.05it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 2.176, val_loss: 2.171, acc: 0.474, val_acc: 0.481, time: 177.067




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 31



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:43,  3.05it/s][A
  1%|          | 4/500 [00:00<02:43,  3.03it/s][A
  1%|          | 5/500 [00:01<02:43,  3.02it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 14/500 [00:04<02:42,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  2.99it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  3.00it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.01it

loss: 2.118, val_loss: 2.124, acc: 0.485, val_acc: 0.486, time: 177.125




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 32



  0%|          | 2/500 [00:00<02:46,  2.99it/s][A
  1%|          | 3/500 [00:00<02:46,  2.99it/s][A
  1%|          | 4/500 [00:01<02:45,  3.00it/s][A
  1%|          | 5/500 [00:01<02:45,  3.00it/s][A
  1%|          | 6/500 [00:01<02:44,  3.00it/s][A
  1%|▏         | 7/500 [00:02<02:44,  2.99it/s][A
  2%|▏         | 8/500 [00:02<02:44,  3.00it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  2.99it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  3.00it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  2.99it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.00it

loss: 2.083, val_loss: 2.115, acc: 0.495, val_acc: 0.488, time: 177.055




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 33



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.02it/s][A
  1%|          | 6/500 [00:01<02:43,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  2.99it/s][A
  4%|▍         | 20/500 [00:06<02:40,  2.99it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.02it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.04it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 2.059, val_loss: 2.105, acc: 0.499, val_acc: 0.493, time: 177.046




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 34



  0%|          | 2/500 [00:00<02:41,  3.08it/s][A
  1%|          | 3/500 [00:00<02:42,  3.07it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.04it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  2.99it/s][A
 63%|██████▎   | 314/500 [01:43<01:02,  2.99it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  2.99it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  2.99it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  3.00it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.02it

loss: 2.030, val_loss: 2.104, acc: 0.505, val_acc: 0.493, time: 177.302




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 35



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.07it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.05it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.05it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.06it/s][A
  3%|▎         | 16/500 [00:04<02:38,  3.05it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.04it/s][A
  4%|▎         | 18/500 [00:05<02:37,  3.06it/s][A
  4%|▍         | 19/500 [00:05<02:37,  3.05it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.05it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:01,  2.98it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.04it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.04it/s][A
 66%|██████▌   | 329/500 [01:48<00:55,  3.05it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 2.015, val_loss: 2.092, acc: 0.509, val_acc: 0.492, time: 176.953




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 36



  0%|          | 2/500 [00:00<02:42,  3.07it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:44,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  2.99it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:58,  2.99it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.02it

loss: 1.995, val_loss: 2.084, acc: 0.512, val_acc: 0.500, time: 177.180




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 37



  0%|          | 2/500 [00:00<02:40,  3.11it/s][A
  1%|          | 3/500 [00:00<02:40,  3.09it/s][A
  1%|          | 4/500 [00:00<02:40,  3.09it/s][A
  1%|          | 5/500 [00:01<02:40,  3.08it/s][A
  1%|          | 6/500 [00:01<02:40,  3.07it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.06it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.05it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.05it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.06it/s][A
  3%|▎         | 14/500 [00:04<02:38,  3.07it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.07it/s][A
  3%|▎         | 16/500 [00:04<02:37,  3.07it/s][A
  3%|▎         | 17/500 [00:05<02:37,  3.08it/s][A
  4%|▎         | 18/500 [00:05<02:36,  3.07it/s][A
  4%|▍         | 19/500 [00:05<02:36,  3.08it/s][A
  4%|▍         | 20/500 [00:06<02:36,  3.07it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.05it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.05it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.00it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 1.977, val_loss: 2.071, acc: 0.516, val_acc: 0.503, time: 176.913




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 38



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:44,  3.01it/s][A
  1%|          | 4/500 [00:00<02:44,  3.01it/s][A
  1%|          | 5/500 [00:01<02:43,  3.02it/s][A
  1%|          | 6/500 [00:01<02:43,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 17/500 [00:05<02:41,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.01it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.01it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.03it/s][A
 64%|██████▎   | 318/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.05it/s][A
 64%|██████▍   | 321/500 [01:46<00:58,  3.04it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 1.968, val_loss: 2.053, acc: 0.519, val_acc: 0.503, time: 177.090




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 39



  0%|          | 2/500 [00:00<02:39,  3.12it/s][A
  1%|          | 3/500 [00:00<02:40,  3.10it/s][A
  1%|          | 4/500 [00:00<02:40,  3.08it/s][A
  1%|          | 5/500 [00:01<02:41,  3.06it/s][A
  1%|          | 6/500 [00:01<02:41,  3.06it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.04it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:00,  3.05it/s][A
 63%|██████▎   | 315/500 [01:44<01:00,  3.05it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.05it/s][A
 63%|██████▎   | 317/500 [01:44<00:59,  3.05it/s][A
 64%|██████▎   | 318/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:46<00:58,  3.04it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.00it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.00it

loss: 1.957, val_loss: 2.071, acc: 0.521, val_acc: 0.501, time: 177.069

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 40



  0%|          | 2/500 [00:00<02:43,  3.04it/s][A
  1%|          | 3/500 [00:00<02:45,  3.01it/s][A
  1%|          | 4/500 [00:01<02:45,  3.01it/s][A
  1%|          | 5/500 [00:01<02:44,  3.01it/s][A
  1%|          | 6/500 [00:01<02:44,  3.01it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.01it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.01it/s][A
 63%|██████▎   | 313/500 [01:43<01:02,  3.00it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.03it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.01it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.02it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 1.861, val_loss: 2.023, acc: 0.544, val_acc: 0.507, time: 176.688




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 41



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:43,  3.03it/s][A
  1%|          | 4/500 [00:00<02:43,  3.03it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.02it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:44,  2.99it/s][A
  2%|▏         | 10/500 [00:02<02:43,  3.00it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.00it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 14/500 [00:04<02:42,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  2.99it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.03it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.05it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.05it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.05it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.07it/s][A
 65%|██████▍   | 323/500 [01:46<00:57,  3.07it/s][A
 65%|██████▍   | 324/500 [01:46<00:57,  3.06it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.06it/s][A
 65%|██████▌   | 326/500 [01:47<00:56,  3.06it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.05it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.05it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.05it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 1.829, val_loss: 2.015, acc: 0.552, val_acc: 0.513, time: 176.521




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 42



  0%|          | 2/500 [00:00<02:40,  3.10it/s][A
  1%|          | 3/500 [00:00<02:41,  3.09it/s][A
  1%|          | 4/500 [00:00<02:41,  3.07it/s][A
  1%|          | 5/500 [00:01<02:41,  3.06it/s][A
  1%|          | 6/500 [00:01<02:41,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.03it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.03it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.03it/s][A
 63%|██████▎   | 313/500 [01:42<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:44<00:59,  3.02it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.04it/s][A
 64%|██████▍   | 322/500 [01:45<00:58,  3.04it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.02it/s][A
 65%|██████▌   | 325/500 [01:46<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.06it/s][A
 66%|██████▌   | 328/500 [01:47<00:56,  3.05it/s][A
 66%|██████▌   | 329/500 [01:48<00:55,  3.06it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.05it

loss: 1.816, val_loss: 2.010, acc: 0.555, val_acc: 0.510, time: 176.085




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 43



  0%|          | 2/500 [00:00<02:41,  3.09it/s][A
  1%|          | 3/500 [00:00<02:42,  3.07it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:41,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.04it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.04it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:42<01:02,  3.01it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:45<00:58,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.02it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:46<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:47<00:56,  3.03it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 1.810, val_loss: 2.006, acc: 0.557, val_acc: 0.515, time: 176.741




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 44



  0%|          | 2/500 [00:00<02:44,  3.03it/s][A
  1%|          | 3/500 [00:00<02:44,  3.02it/s][A
  1%|          | 4/500 [00:00<02:44,  3.02it/s][A
  1%|          | 5/500 [00:01<02:43,  3.03it/s][A
  1%|          | 6/500 [00:01<02:42,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.05it/s][A
  2%|▏         | 12/500 [00:03<02:39,  3.05it/s][A
  3%|▎         | 13/500 [00:03<02:39,  3.06it/s][A
  3%|▎         | 14/500 [00:04<02:38,  3.06it/s][A
  3%|▎         | 15/500 [00:04<02:38,  3.07it/s][A
  3%|▎         | 16/500 [00:04<02:37,  3.07it/s][A
  3%|▎         | 17/500 [00:05<02:37,  3.07it/s][A
  4%|▎         | 18/500 [00:05<02:36,  3.08it/s][A
  4%|▍         | 19/500 [00:05<02:36,  3.08it/s][A
  4%|▍         | 20/500 [00:06<02:36,  3.07it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.04it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.04it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.04it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.03it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.03it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 324/500 [01:46<00:57,  3.04it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.04it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.04it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.04it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.04it

loss: 1.805, val_loss: 2.000, acc: 0.557, val_acc: 0.517, time: 176.772




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 45



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.05it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:41,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.02it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:38,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:03,  2.96it/s][A
 63%|██████▎   | 313/500 [01:43<01:03,  2.96it/s][A
 63%|██████▎   | 314/500 [01:43<01:02,  2.97it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  2.99it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  2.99it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.00it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.00it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.00it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:55,  3.04it

loss: 1.793, val_loss: 2.004, acc: 0.560, val_acc: 0.515, time: 176.883

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 46



  0%|          | 2/500 [00:00<02:41,  3.08it/s][A
  1%|          | 3/500 [00:00<02:43,  3.05it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.04it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.05it/s][A
  2%|▏         | 9/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 10/500 [00:02<02:40,  3.05it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.05it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.03it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:40,  3.00it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:01,  2.99it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  2.99it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:59,  2.99it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  2.99it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:58,  2.99it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  3.02it

loss: 1.788, val_loss: 1.995, acc: 0.562, val_acc: 0.519, time: 177.130

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 47



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:43,  3.04it/s][A
  1%|          | 4/500 [00:00<02:43,  3.04it/s][A
  1%|          | 5/500 [00:01<02:42,  3.05it/s][A
  1%|          | 6/500 [00:01<02:42,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:41,  3.05it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.03it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:42,  3.00it/s][A
  3%|▎         | 14/500 [00:04<02:42,  3.00it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.00it/s][A
  3%|▎         | 16/500 [00:04<02:41,  2.99it/s][A
  3%|▎         | 17/500 [00:05<02:41,  2.99it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:40,  3.00it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:01,  3.08it/s][A
 63%|██████▎   | 313/500 [01:43<01:00,  3.07it/s][A
 63%|██████▎   | 314/500 [01:43<01:00,  3.07it/s][A
 63%|██████▎   | 315/500 [01:43<01:00,  3.06it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.05it/s][A
 63%|██████▎   | 317/500 [01:44<00:59,  3.06it/s][A
 64%|██████▎   | 318/500 [01:44<00:59,  3.06it/s][A
 64%|██████▍   | 319/500 [01:45<00:58,  3.07it/s][A
 64%|██████▍   | 320/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 321/500 [01:45<00:58,  3.06it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.06it/s][A
 65%|██████▍   | 323/500 [01:46<00:57,  3.08it/s][A
 65%|██████▍   | 324/500 [01:46<00:57,  3.09it/s][A
 65%|██████▌   | 325/500 [01:47<00:56,  3.08it/s][A
 65%|██████▌   | 326/500 [01:47<00:56,  3.08it/s][A
 65%|██████▌   | 327/500 [01:47<00:56,  3.04it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.05it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.03it

loss: 1.777, val_loss: 2.009, acc: 0.565, val_acc: 0.513, time: 177.064

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 48



  0%|          | 2/500 [00:00<02:40,  3.09it/s][A
  1%|          | 3/500 [00:00<02:41,  3.08it/s][A
  1%|          | 4/500 [00:00<02:41,  3.07it/s][A
  1%|          | 5/500 [00:01<02:41,  3.06it/s][A
  1%|          | 6/500 [00:01<02:41,  3.05it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.04it/s][A
  2%|▏         | 8/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 9/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.04it/s][A
  2%|▏         | 11/500 [00:03<02:40,  3.04it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.03it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.02it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.02it/s][A
  3%|▎         | 15/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 16/500 [00:04<02:39,  3.03it/s][A
  3%|▎         | 17/500 [00:05<02:38,  3.05it/s][A
  4%|▎         | 18/500 [00:05<02:38,  3.05it/s][A
  4%|▍         | 19/500 [00:05<02:37,  3.05it/s][A
  4%|▍         | 20/500 [00:06<02:37,  3.04it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.03it/s][A
 63%|██████▎   | 316/500 [01:44<01:00,  3.02it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.02it/s][A
 64%|██████▎   | 318/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 319/500 [01:45<00:59,  3.04it/s][A
 64%|██████▍   | 320/500 [01:45<00:58,  3.05it/s][A
 64%|██████▍   | 321/500 [01:46<00:58,  3.05it/s][A
 64%|██████▍   | 322/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.04it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.03it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.03it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.03it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.02it

loss: 1.780, val_loss: 2.004, acc: 0.564, val_acc: 0.514, time: 177.217

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 49



  0%|          | 2/500 [00:00<02:41,  3.09it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.06it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:43,  3.02it/s][A
  1%|▏         | 7/500 [00:01<02:43,  3.01it/s][A
  2%|▏         | 8/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 9/500 [00:02<02:43,  3.01it/s][A
  2%|▏         | 10/500 [00:02<02:42,  3.01it/s][A
  2%|▏         | 11/500 [00:03<02:42,  3.01it/s][A
  2%|▏         | 12/500 [00:03<02:42,  3.01it/s][A
  3%|▎         | 13/500 [00:03<02:41,  3.01it/s][A
  3%|▎         | 14/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 15/500 [00:04<02:41,  3.01it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.01it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:39,  3.03it/s][A
  4%|▍         | 19/500 [00:05<02:38,  3.03it/s][A
  4%|▍         | 20/500 [00:06<02:39,  3.02it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:42<01:02,  3.02it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.03it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:43<01:01,  3.02it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.01it/s][A
 64%|██████▎   | 318/500 [01:44<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 321/500 [01:45<00:59,  3.00it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.01it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:46<00:58,  3.01it/s][A
 65%|██████▌   | 325/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.02it/s][A
 65%|██████▌   | 327/500 [01:47<00:57,  3.03it/s][A
 66%|██████▌   | 328/500 [01:48<00:56,  3.02it/s][A
 66%|██████▌   | 329/500 [01:48<00:56,  3.01it/s][A
 66%|██████▌   | 330/500 [01:48<00:56,  3.01it

loss: 1.779, val_loss: 1.993, acc: 0.565, val_acc: 0.517, time: 176.869

Learning rate is dropped!




  0%|          | 1/500 [00:00<?, ?it/s][A

epoch 50



  0%|          | 2/500 [00:00<02:42,  3.06it/s][A
  1%|          | 3/500 [00:00<02:42,  3.06it/s][A
  1%|          | 4/500 [00:00<02:42,  3.05it/s][A
  1%|          | 5/500 [00:01<02:42,  3.04it/s][A
  1%|          | 6/500 [00:01<02:42,  3.03it/s][A
  1%|▏         | 7/500 [00:01<02:42,  3.03it/s][A
  2%|▏         | 8/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 9/500 [00:02<02:42,  3.02it/s][A
  2%|▏         | 10/500 [00:02<02:41,  3.03it/s][A
  2%|▏         | 11/500 [00:03<02:41,  3.03it/s][A
  2%|▏         | 12/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 13/500 [00:03<02:40,  3.04it/s][A
  3%|▎         | 14/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 15/500 [00:04<02:39,  3.04it/s][A
  3%|▎         | 16/500 [00:04<02:40,  3.02it/s][A
  3%|▎         | 17/500 [00:05<02:39,  3.02it/s][A
  4%|▎         | 18/500 [00:05<02:40,  3.01it/s][A
  4%|▍         | 19/500 [00:05<02:40,  3.00it/s][A
  4%|▍         | 20/500 [00:06<02:40,  2.99it/s][A
  4%|▍         | 21

 62%|██████▏   | 312/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 313/500 [01:43<01:01,  3.04it/s][A
 63%|██████▎   | 314/500 [01:43<01:01,  3.01it/s][A
 63%|██████▎   | 315/500 [01:44<01:01,  3.01it/s][A
 63%|██████▎   | 316/500 [01:44<01:01,  3.00it/s][A
 63%|██████▎   | 317/500 [01:44<01:00,  3.00it/s][A
 64%|██████▎   | 318/500 [01:45<01:00,  3.01it/s][A
 64%|██████▍   | 319/500 [01:45<01:00,  3.00it/s][A
 64%|██████▍   | 320/500 [01:45<00:59,  3.01it/s][A
 64%|██████▍   | 321/500 [01:46<00:59,  3.01it/s][A
 64%|██████▍   | 322/500 [01:46<00:59,  3.02it/s][A
 65%|██████▍   | 323/500 [01:46<00:58,  3.01it/s][A
 65%|██████▍   | 324/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 325/500 [01:47<00:58,  3.00it/s][A
 65%|██████▌   | 326/500 [01:47<00:57,  3.01it/s][A
 65%|██████▌   | 327/500 [01:48<00:57,  3.01it/s][A
 66%|██████▌   | 328/500 [01:48<00:57,  3.00it/s][A
 66%|██████▌   | 329/500 [01:48<00:57,  2.99it/s][A
 66%|██████▌   | 330/500 [01:49<00:56,  2.99it

loss: 1.776, val_loss: 1.997, acc: 0.564, val_acc: 0.516, time: 177.146

Learning rate is dropped!

Writing logs and saving the trained model.
