In [11]:
import os
from random import shuffle
import cv2
import numpy as np
import tensorflow as tf
from tqdm import tqdm
import tflearn
from tflearn.layers.conv import conv_2d, max_pool_2d
from tflearn.layers.core import input_data, dropout, fully_connected
from tflearn.layers.estimator import regression

In [12]:
#Training Parameters
LR = 1e-3
IMG_SIZE = 50
MODEL_NAME = 'dogs-vs-cats-4-layer-covnet'
TRAIN_DIR = 'C:/Users/modak/Anaconda3/envs/TensorFlow_QRC-VT/train/train'
TEST_DIR = 'C:/Users/modak/Anaconda3/envs/TensorFlow_QRC-VT/test/test'

In [13]:
def create_label(image_name):
    word_label = image_name.split('.')[-3]
    word_label = word_label.split('/')[-1]
    #print(word_label)
    if word_label == "cat":
        return np.array([1, 0])
    elif word_label == "dog":
        return np.array([0, 1])


cat




array([1, 0])

In [14]:
def create_train_data():
    """Read image as 50x50 and grayscale"""
    training_data = []
    for img in tqdm(os.listdir(TRAIN_DIR)):
        path = os.path.join(TRAIN_DIR, img)
        img_data = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
        img_data = cv2.resize(img_data, (IMG_SIZE, IMG_SIZE))
        training_data.append([np.array(img_data), create_label(img)])
    shuffle(training_data)

    # Save processed data
    if not os.path.exists('data'):
        os.mkdir('data')
    np.save('data/train.npy', training_data)

    return training_data


In [15]:
def create_test_data():
    test_data = []
    for img in tqdm(os.listdir(TEST_DIR)):
        path = os.path.join(TEST_DIR, img)
        img_num = img.split('.')[0]
        img_data = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
        img_data = cv2.resize(img_data, (IMG_SIZE, IMG_SIZE))
        test_data.append([np.array(img_data), img_num])
    shuffle(test_data)

    # Save processed data
    if not os.path.exists('data'):
        os.mkdir('data')
    np.save('data/test.npy', test_data)

    return test_data

In [16]:
train_data = create_train_data()

  0%|          | 0/25000 [00:00<?, ?it/s]

  0%|          | 49/25000 [00:00<00:51, 482.10it/s]

  0%|          | 94/25000 [00:00<00:53, 463.18it/s]

  1%|          | 139/25000 [00:00<00:54, 458.67it/s]

  1%|          | 185/25000 [00:00<00:54, 457.17it/s]

  1%|          | 233/25000 [00:00<00:54, 457.18it/s]

  1%|          | 271/25000 [00:00<00:59, 415.25it/s]

  1%|          | 306/25000 [00:00<01:01, 400.70it/s]

  1%|▏         | 356/25000 [00:00<00:59, 411.58it/s]

  2%|▏         | 405/25000 [00:00<00:58, 419.30it/s]

  2%|▏         | 453/25000 [00:01<00:57, 424.78it/s]

  2%|▏         | 501/25000 [00:01<00:57, 429.39it/s]

  2%|▏         | 548/25000 [00:01<00:56, 432.20it/s]

  2%|▏         | 596/25000 [00:01<00:56, 435.40it/s]

  3%|▎         | 643/25000 [00:01<00:55, 437.29it/s]

  3%|▎         | 690/25000 [00:01<00:55, 435.05it/s]

  3%|▎         | 742/25000 [00:01<00:55, 439.57it/s]

  3%|▎         | 790/25000 [00:01<00:54, 441.83it/s]

  3%|▎         | 838/25000 [00:01<00:54, 443.60it/s]

  4%|▎         | 886/25000 [00:01<00:54, 444.90it/s]

  4%|▎         | 934/25000 [00:02<00:54, 445.65it/s]

  4%|▍         | 982/25000 [00:02<00:53, 446.71it/s]

  4%|▍         | 1029/25000 [00:02<00:53, 446.99it/s]

  4%|▍         | 1078/25000 [00:02<00:53, 448.78it/s]

  5%|▍         | 1126/25000 [00:02<00:53, 449.69it/s]

  5%|▍         | 1174/25000 [00:02<00:52, 450.30it/s]

  5%|▍         | 1223/25000 [00:02<00:52, 451.75it/s]

  5%|▌         | 1272/25000 [00:02<00:52, 452.94it/s]

  5%|▌         | 1325/25000 [00:02<00:51, 455.58it/s]

  6%|▌         | 1377/25000 [00:03<00:51, 457.43it/s]

  6%|▌         | 1428/25000 [00:03<00:51, 459.01it/s]

  6%|▌         | 1479/25000 [00:03<00:51, 460.33it/s]

  6%|▌         | 1530/25000 [00:03<00:50, 461.07it/s]

  6%|▋         | 1580/25000 [00:03<00:50, 462.14it/s]

  7%|▋         | 1630/25000 [00:03<00:50, 462.68it/s]

  7%|▋         | 1686/25000 [00:03<00:50, 465.14it/s]

  7%|▋         | 1738/25000 [00:03<00:49, 466.29it/s]

  7%|▋         | 1789/25000 [00:03<00:49, 466.74it/s]

  7%|▋         | 1840/25000 [00:03<00:49, 467.64it/s]

  8%|▊         | 1891/25000 [00:04<00:49, 468.50it/s]

  8%|▊         | 1942/25000 [00:04<00:49, 469.23it/s]

  8%|▊         | 1992/25000 [00:04<00:49, 469.03it/s]

  8%|▊         | 2041/25000 [00:04<00:48, 469.48it/s]

  8%|▊         | 2092/25000 [00:04<00:48, 470.37it/s]

  9%|▊         | 2144/25000 [00:04<00:48, 471.44it/s]

  9%|▉         | 2195/25000 [00:04<00:48, 471.90it/s]

  9%|▉         | 2245/25000 [00:04<00:48, 472.45it/s]

  9%|▉         | 2295/25000 [00:04<00:48, 473.00it/s]

  9%|▉         | 2349/25000 [00:04<00:47, 474.19it/s]

 10%|▉         | 2402/25000 [00:05<00:47, 475.15it/s]

 10%|▉         | 2454/25000 [00:05<00:47, 475.60it/s]

 10%|█         | 2505/25000 [00:05<00:47, 475.99it/s]

 10%|█         | 2559/25000 [00:05<00:47, 477.16it/s]

 10%|█         | 2614/25000 [00:05<00:46, 478.41it/s]

 11%|█         | 2667/25000 [00:05<00:46, 479.22it/s]

 11%|█         | 2720/25000 [00:05<00:46, 479.49it/s]

 11%|█         | 2774/25000 [00:05<00:46, 480.31it/s]

 11%|█▏        | 2826/25000 [00:05<00:46, 480.88it/s]

 12%|█▏        | 2878/25000 [00:05<00:45, 481.46it/s]

 12%|█▏        | 2933/25000 [00:06<00:45, 482.54it/s]

 12%|█▏        | 2989/25000 [00:06<00:45, 483.70it/s]

 12%|█▏        | 3043/25000 [00:06<00:45, 484.38it/s]

 12%|█▏        | 3097/25000 [00:06<00:45, 484.23it/s]

 13%|█▎        | 3155/25000 [00:06<00:44, 485.68it/s]

 13%|█▎        | 3209/25000 [00:06<00:44, 486.37it/s]

 13%|█▎        | 3263/25000 [00:06<00:44, 487.02it/s]

 13%|█▎        | 3317/25000 [00:06<00:44, 487.68it/s]

 13%|█▎        | 3371/25000 [00:06<00:44, 488.15it/s]

 14%|█▎        | 3424/25000 [00:07<00:44, 488.61it/s]

 14%|█▍        | 3478/25000 [00:07<00:43, 489.28it/s]

 14%|█▍        | 3532/25000 [00:07<00:43, 489.93it/s]

 14%|█▍        | 3586/25000 [00:07<00:43, 490.32it/s]

 15%|█▍        | 3640/25000 [00:07<00:43, 490.95it/s]

 15%|█▍        | 3693/25000 [00:07<00:43, 491.38it/s]

 15%|█▍        | 3747/25000 [00:07<00:43, 491.91it/s]

 15%|█▌        | 3800/25000 [00:07<00:43, 492.28it/s]

 15%|█▌        | 3853/25000 [00:07<00:42, 492.73it/s]

 16%|█▌        | 3906/25000 [00:07<00:42, 493.14it/s]

 16%|█▌        | 3959/25000 [00:08<00:42, 493.31it/s]

 16%|█▌        | 4012/25000 [00:08<00:42, 493.72it/s]

 16%|█▋        | 4067/25000 [00:08<00:42, 494.34it/s]

 16%|█▋        | 4120/25000 [00:08<00:42, 494.64it/s]

 17%|█▋        | 4173/25000 [00:08<00:42, 494.95it/s]

 17%|█▋        | 4228/25000 [00:08<00:41, 495.50it/s]

 17%|█▋        | 4281/25000 [00:08<00:41, 495.67it/s]

 17%|█▋        | 4335/25000 [00:08<00:41, 496.09it/s]

 18%|█▊        | 4388/25000 [00:08<00:41, 496.36it/s]

 18%|█▊        | 4441/25000 [00:08<00:41, 496.72it/s]

 18%|█▊        | 4494/25000 [00:09<00:41, 495.64it/s]

 18%|█▊        | 4545/25000 [00:09<00:41, 495.77it/s]

 18%|█▊        | 4599/25000 [00:09<00:41, 496.17it/s]

 19%|█▊        | 4653/25000 [00:09<00:40, 496.57it/s]

 19%|█▉        | 4706/25000 [00:09<00:40, 496.91it/s]

 19%|█▉        | 4759/25000 [00:09<00:40, 497.23it/s]

 19%|█▉        | 4812/25000 [00:09<00:40, 497.45it/s]

 19%|█▉        | 4865/25000 [00:09<00:40, 497.60it/s]

 20%|█▉        | 4917/25000 [00:09<00:40, 497.60it/s]

 20%|█▉        | 4971/25000 [00:09<00:40, 497.97it/s]

 20%|██        | 5023/25000 [00:10<00:40, 497.93it/s]

 20%|██        | 5075/25000 [00:10<00:40, 497.95it/s]

 21%|██        | 5128/25000 [00:10<00:39, 498.24it/s]

 21%|██        | 5181/25000 [00:10<00:39, 498.47it/s]

 21%|██        | 5233/25000 [00:10<00:39, 498.59it/s]

 21%|██        | 5285/25000 [00:10<00:39, 498.75it/s]

 21%|██▏       | 5340/25000 [00:10<00:39, 499.18it/s]

 22%|██▏       | 5393/25000 [00:10<00:39, 499.13it/s]

 22%|██▏       | 5446/25000 [00:10<00:39, 499.39it/s]

 22%|██▏       | 5499/25000 [00:11<00:39, 499.61it/s]

 22%|██▏       | 5551/25000 [00:11<00:38, 499.77it/s]

 22%|██▏       | 5608/25000 [00:11<00:38, 500.37it/s]

 23%|██▎       | 5663/25000 [00:11<00:38, 500.74it/s]

 23%|██▎       | 5717/25000 [00:11<00:38, 501.07it/s]

 23%|██▎       | 5771/25000 [00:11<00:38, 500.75it/s]

 23%|██▎       | 5823/25000 [00:11<00:38, 500.86it/s]

 24%|██▎       | 5875/25000 [00:11<00:38, 500.92it/s]

 24%|██▎       | 5930/25000 [00:11<00:38, 501.25it/s]

 24%|██▍       | 5983/25000 [00:11<00:37, 501.41it/s]

 24%|██▍       | 6036/25000 [00:12<00:37, 501.62it/s]

 24%|██▍       | 6089/25000 [00:12<00:37, 501.70it/s]

 25%|██▍       | 6141/25000 [00:12<00:37, 501.66it/s]

 25%|██▍       | 6193/25000 [00:12<00:37, 501.61it/s]

 25%|██▍       | 6246/25000 [00:12<00:37, 501.83it/s]

 25%|██▌       | 6298/25000 [00:12<00:37, 501.93it/s]

 25%|██▌       | 6352/25000 [00:12<00:37, 502.17it/s]

 26%|██▌       | 6404/25000 [00:12<00:37, 502.27it/s]

 26%|██▌       | 6456/25000 [00:12<00:36, 502.37it/s]

 26%|██▌       | 6508/25000 [00:12<00:36, 502.49it/s]

 26%|██▌       | 6560/25000 [00:13<00:36, 502.47it/s]

 26%|██▋       | 6615/25000 [00:13<00:36, 502.77it/s]

 27%|██▋       | 6668/25000 [00:13<00:36, 502.96it/s]

 27%|██▋       | 6721/25000 [00:13<00:36, 503.02it/s]

 27%|██▋       | 6777/25000 [00:13<00:36, 503.39it/s]

 27%|██▋       | 6833/25000 [00:13<00:36, 503.75it/s]

 28%|██▊       | 6887/25000 [00:13<00:35, 503.98it/s]

 28%|██▊       | 6941/25000 [00:13<00:35, 503.98it/s]

 28%|██▊       | 6994/25000 [00:13<00:35, 504.15it/s]

 28%|██▊       | 7047/25000 [00:13<00:35, 504.14it/s]

 28%|██▊       | 7099/25000 [00:14<00:35, 504.14it/s]

 29%|██▊       | 7151/25000 [00:14<00:35, 504.22it/s]

 29%|██▉       | 7204/25000 [00:14<00:35, 504.38it/s]

 29%|██▉       | 7256/25000 [00:14<00:35, 504.09it/s]

 29%|██▉       | 7307/25000 [00:14<00:35, 504.11it/s]

 29%|██▉       | 7359/25000 [00:14<00:34, 504.19it/s]

 30%|██▉       | 7413/25000 [00:14<00:34, 504.39it/s]

 30%|██▉       | 7465/25000 [00:14<00:34, 504.38it/s]

 30%|███       | 7519/25000 [00:14<00:34, 504.62it/s]

 30%|███       | 7572/25000 [00:15<00:34, 504.75it/s]

 30%|███       | 7625/25000 [00:15<00:34, 504.67it/s]

 31%|███       | 7677/25000 [00:15<00:34, 504.62it/s]

 31%|███       | 7728/25000 [00:15<00:34, 504.59it/s]

 31%|███       | 7780/25000 [00:15<00:34, 504.68it/s]

 31%|███▏      | 7835/25000 [00:15<00:33, 504.97it/s]

 32%|███▏      | 7888/25000 [00:15<00:33, 504.68it/s]

 32%|███▏      | 7943/25000 [00:15<00:33, 504.94it/s]

 32%|███▏      | 7995/25000 [00:15<00:33, 504.93it/s]

 32%|███▏      | 8049/25000 [00:15<00:33, 505.10it/s]

 32%|███▏      | 8101/25000 [00:16<00:33, 505.14it/s]

 33%|███▎      | 8153/25000 [00:16<00:33, 505.15it/s]

 33%|███▎      | 8205/25000 [00:16<00:33, 505.27it/s]

 33%|███▎      | 8257/25000 [00:16<00:33, 505.27it/s]

 33%|███▎      | 8309/25000 [00:16<00:33, 505.34it/s]

 33%|███▎      | 8362/25000 [00:16<00:32, 505.44it/s]

 34%|███▎      | 8414/25000 [00:16<00:32, 505.41it/s]

 34%|███▍      | 8466/25000 [00:16<00:32, 505.47it/s]

 34%|███▍      | 8520/25000 [00:16<00:32, 505.62it/s]

 34%|███▍      | 8574/25000 [00:16<00:32, 505.81it/s]

 35%|███▍      | 8628/25000 [00:17<00:32, 505.97it/s]

 35%|███▍      | 8681/25000 [00:17<00:32, 505.93it/s]

 35%|███▍      | 8735/25000 [00:17<00:32, 506.09it/s]

 35%|███▌      | 8789/25000 [00:17<00:32, 506.25it/s]

 35%|███▌      | 8842/25000 [00:17<00:31, 506.32it/s]

 36%|███▌      | 8897/25000 [00:17<00:31, 506.56it/s]

 36%|███▌      | 8951/25000 [00:17<00:31, 506.58it/s]

 36%|███▌      | 9004/25000 [00:17<00:31, 506.62it/s]

 36%|███▌      | 9057/25000 [00:17<00:31, 505.71it/s]

 36%|███▋      | 9106/25000 [00:18<00:31, 503.30it/s]

 37%|███▋      | 9148/25000 [00:18<00:31, 501.03it/s]

 37%|███▋      | 9191/25000 [00:18<00:31, 500.59it/s]

 37%|███▋      | 9230/25000 [00:18<00:31, 498.68it/s]

 37%|███▋      | 9265/25000 [00:18<00:31, 496.78it/s]

 37%|███▋      | 9310/25000 [00:18<00:31, 496.48it/s]

 37%|███▋      | 9364/25000 [00:18<00:31, 496.67it/s]

 38%|███▊      | 9411/25000 [00:18<00:31, 496.51it/s]

 38%|███▊      | 9454/25000 [00:19<00:31, 496.15it/s]

 38%|███▊      | 9497/25000 [00:19<00:31, 495.38it/s]

 38%|███▊      | 9546/25000 [00:19<00:31, 495.19it/s]

 38%|███▊      | 9589/25000 [00:19<00:31, 494.71it/s]

 39%|███▊      | 9631/25000 [00:19<00:31, 491.12it/s]

 39%|███▊      | 9666/25000 [00:19<00:31, 489.21it/s]

 39%|███▉      | 9698/25000 [00:19<00:31, 488.20it/s]

 39%|███▉      | 9730/25000 [00:19<00:31, 486.86it/s]

 39%|███▉      | 9762/25000 [00:20<00:31, 486.02it/s]

 39%|███▉      | 9801/25000 [00:20<00:31, 485.54it/s]

 39%|███▉      | 9838/25000 [00:20<00:31, 484.96it/s]

 39%|███▉      | 9873/25000 [00:20<00:31, 484.01it/s]

 40%|███▉      | 9907/25000 [00:20<00:31, 482.84it/s]

 40%|███▉      | 9939/25000 [00:20<00:31, 481.22it/s]

 40%|███▉      | 9975/25000 [00:20<00:31, 480.56it/s]

 40%|████      | 10012/25000 [00:20<00:31, 480.02it/s]

 40%|████      | 10045/25000 [00:20<00:31, 479.09it/s]

 40%|████      | 10090/25000 [00:21<00:31, 478.95it/s]

 41%|████      | 10126/25000 [00:21<00:31, 477.92it/s]

 41%|████      | 10166/25000 [00:21<00:31, 477.51it/s]

 41%|████      | 10215/25000 [00:21<00:30, 477.55it/s]

 41%|████      | 10268/25000 [00:21<00:30, 477.76it/s]

 41%|████▏     | 10320/25000 [00:21<00:30, 477.90it/s]

 42%|████▏     | 10378/25000 [00:21<00:30, 478.36it/s]

 42%|████▏     | 10428/25000 [00:21<00:30, 478.45it/s]

 42%|████▏     | 10478/25000 [00:21<00:30, 478.53it/s]

 42%|████▏     | 10529/25000 [00:21<00:30, 478.63it/s]

 42%|████▏     | 10579/25000 [00:22<00:30, 478.61it/s]

 43%|████▎     | 10634/25000 [00:22<00:30, 478.86it/s]

 43%|████▎     | 10685/25000 [00:22<00:29, 478.62it/s]

 43%|████▎     | 10734/25000 [00:22<00:29, 478.63it/s]

 43%|████▎     | 10783/25000 [00:22<00:29, 478.52it/s]

 43%|████▎     | 10839/25000 [00:22<00:29, 478.82it/s]

 44%|████▎     | 10892/25000 [00:22<00:29, 479.02it/s]

 44%|████▍     | 10952/25000 [00:22<00:29, 479.50it/s]

 44%|████▍     | 11005/25000 [00:22<00:29, 479.56it/s]

 44%|████▍     | 11057/25000 [00:23<00:29, 479.43it/s]

 44%|████▍     | 11107/25000 [00:23<00:28, 479.30it/s]

 45%|████▍     | 11157/25000 [00:23<00:28, 479.38it/s]

 45%|████▍     | 11206/25000 [00:23<00:28, 479.17it/s]

 45%|████▌     | 11254/25000 [00:23<00:28, 479.10it/s]

 45%|████▌     | 11301/25000 [00:23<00:28, 478.84it/s]

 45%|████▌     | 11352/25000 [00:23<00:28, 478.97it/s]

 46%|████▌     | 11400/25000 [00:23<00:28, 478.76it/s]

 46%|████▌     | 11447/25000 [00:23<00:28, 478.72it/s]

 46%|████▌     | 11494/25000 [00:24<00:28, 478.56it/s]

 46%|████▌     | 11544/25000 [00:24<00:28, 478.62it/s]

 46%|████▋     | 11595/25000 [00:24<00:28, 478.74it/s]

 47%|████▋     | 11649/25000 [00:24<00:27, 478.95it/s]

 47%|████▋     | 11699/25000 [00:24<00:27, 478.89it/s]

 47%|████▋     | 11751/25000 [00:24<00:27, 479.04it/s]

 47%|████▋     | 11803/25000 [00:24<00:27, 479.17it/s]

 47%|████▋     | 11856/25000 [00:24<00:27, 479.34it/s]

 48%|████▊     | 11909/25000 [00:24<00:27, 479.52it/s]

 48%|████▊     | 11964/25000 [00:24<00:27, 479.77it/s]

 48%|████▊     | 12016/25000 [00:25<00:27, 479.86it/s]

 48%|████▊     | 12068/25000 [00:25<00:26, 479.85it/s]

 48%|████▊     | 12119/25000 [00:25<00:26, 479.86it/s]

 49%|████▊     | 12169/25000 [00:25<00:26, 479.71it/s]

 49%|████▉     | 12219/25000 [00:25<00:26, 479.77it/s]

 49%|████▉     | 12276/25000 [00:25<00:26, 480.10it/s]

 49%|████▉     | 12334/25000 [00:25<00:26, 480.49it/s]

 50%|████▉     | 12394/25000 [00:25<00:26, 480.94it/s]

 50%|████▉     | 12449/25000 [00:25<00:26, 480.21it/s]

 50%|████▉     | 12499/25000 [00:26<00:26, 480.16it/s]

 50%|█████     | 12550/25000 [00:26<00:25, 480.25it/s]

 50%|█████     | 12601/25000 [00:26<00:25, 480.36it/s]

 51%|█████     | 12655/25000 [00:26<00:25, 480.57it/s]

 51%|█████     | 12710/25000 [00:26<00:25, 480.82it/s]

 51%|█████     | 12768/25000 [00:26<00:25, 481.18it/s]

 51%|█████▏    | 12825/25000 [00:26<00:25, 481.51it/s]

 52%|█████▏    | 12881/25000 [00:26<00:25, 481.78it/s]

 52%|█████▏    | 12937/25000 [00:26<00:25, 482.05it/s]

 52%|█████▏    | 12998/25000 [00:26<00:24, 482.50it/s]

 52%|█████▏    | 13055/25000 [00:27<00:24, 482.66it/s]

 52%|█████▏    | 13115/25000 [00:27<00:24, 483.09it/s]

 53%|█████▎    | 13172/25000 [00:27<00:24, 483.21it/s]

 53%|█████▎    | 13228/25000 [00:27<00:24, 483.40it/s]

 53%|█████▎    | 13284/25000 [00:27<00:24, 483.65it/s]

 53%|█████▎    | 13341/25000 [00:27<00:24, 483.93it/s]

 54%|█████▎    | 13398/25000 [00:27<00:23, 484.22it/s]

 54%|█████▍    | 13454/25000 [00:27<00:23, 484.38it/s]

 54%|█████▍    | 13509/25000 [00:27<00:23, 483.24it/s]

 54%|█████▍    | 13561/25000 [00:28<00:23, 483.35it/s]

 54%|█████▍    | 13616/25000 [00:28<00:23, 483.56it/s]

 55%|█████▍    | 13671/25000 [00:28<00:23, 483.78it/s]

 55%|█████▍    | 13724/25000 [00:28<00:23, 483.94it/s]

 55%|█████▌    | 13782/25000 [00:28<00:23, 484.26it/s]

 55%|█████▌    | 13836/25000 [00:28<00:23, 482.93it/s]

 56%|█████▌    | 13883/25000 [00:28<00:23, 482.00it/s]

 56%|█████▌    | 13925/25000 [00:28<00:23, 481.22it/s]

 56%|█████▌    | 13971/25000 [00:29<00:22, 481.14it/s]

 56%|█████▌    | 14012/25000 [00:29<00:22, 480.58it/s]

 56%|█████▌    | 14051/25000 [00:29<00:22, 480.15it/s]

 56%|█████▋    | 14097/25000 [00:29<00:22, 480.06it/s]

 57%|█████▋    | 14138/25000 [00:29<00:22, 479.54it/s]

 57%|█████▋    | 14183/25000 [00:29<00:22, 479.42it/s]

 57%|█████▋    | 14231/25000 [00:29<00:22, 479.41it/s]

 57%|█████▋    | 14276/25000 [00:29<00:22, 479.29it/s]

 57%|█████▋    | 14324/25000 [00:29<00:22, 479.26it/s]

 57%|█████▋    | 14370/25000 [00:29<00:22, 479.18it/s]

 58%|█████▊    | 14419/25000 [00:30<00:22, 479.21it/s]

 58%|█████▊    | 14465/25000 [00:30<00:21, 479.10it/s]

 58%|█████▊    | 14512/25000 [00:30<00:21, 479.04it/s]

 58%|█████▊    | 14558/25000 [00:30<00:21, 478.95it/s]

 58%|█████▊    | 14606/25000 [00:30<00:21, 478.95it/s]

 59%|█████▊    | 14653/25000 [00:30<00:21, 478.62it/s]

 59%|█████▉    | 14698/25000 [00:30<00:21, 478.28it/s]

 59%|█████▉    | 14749/25000 [00:30<00:21, 478.36it/s]

 59%|█████▉    | 14794/25000 [00:30<00:21, 478.22it/s]

 59%|█████▉    | 14839/25000 [00:31<00:21, 477.65it/s]

 60%|█████▉    | 14883/25000 [00:31<00:21, 477.51it/s]

 60%|█████▉    | 14928/25000 [00:31<00:21, 477.40it/s]

 60%|█████▉    | 14971/25000 [00:31<00:21, 477.22it/s]

 60%|██████    | 15014/25000 [00:31<00:20, 476.93it/s]

 60%|██████    | 15059/25000 [00:31<00:20, 476.83it/s]

 60%|██████    | 15107/25000 [00:31<00:20, 476.84it/s]

 61%|██████    | 15152/25000 [00:31<00:20, 476.70it/s]

 61%|██████    | 15198/25000 [00:31<00:20, 476.64it/s]

 61%|██████    | 15247/25000 [00:31<00:20, 476.66it/s]

 61%|██████    | 15295/25000 [00:32<00:20, 476.66it/s]

 61%|██████▏   | 15353/25000 [00:32<00:20, 476.96it/s]

 62%|██████▏   | 15403/25000 [00:32<00:20, 476.87it/s]

 62%|██████▏   | 15453/25000 [00:32<00:20, 476.91it/s]

 62%|██████▏   | 15502/25000 [00:32<00:19, 476.60it/s]

 62%|██████▏   | 15548/25000 [00:32<00:19, 476.54it/s]

 62%|██████▏   | 15594/25000 [00:32<00:19, 476.44it/s]

 63%|██████▎   | 15641/25000 [00:32<00:19, 476.41it/s]

 63%|██████▎   | 15689/25000 [00:32<00:19, 476.40it/s]

 63%|██████▎   | 15736/25000 [00:33<00:19, 476.36it/s]

 63%|██████▎   | 15787/25000 [00:33<00:19, 476.45it/s]

 63%|██████▎   | 15835/25000 [00:33<00:19, 476.20it/s]

 64%|██████▎   | 15881/25000 [00:33<00:19, 475.14it/s]

 64%|██████▎   | 15921/25000 [00:33<00:19, 474.24it/s]

 64%|██████▍   | 15958/25000 [00:33<00:19, 473.41it/s]

 64%|██████▍   | 15992/25000 [00:33<00:19, 472.60it/s]

 64%|██████▍   | 16024/25000 [00:33<00:19, 471.97it/s]

 64%|██████▍   | 16068/25000 [00:34<00:18, 471.84it/s]

 64%|██████▍   | 16118/25000 [00:34<00:18, 471.92it/s]

 65%|██████▍   | 16167/25000 [00:34<00:18, 471.94it/s]

 65%|██████▍   | 16217/25000 [00:34<00:18, 472.02it/s]

 65%|██████▌   | 16262/25000 [00:34<00:18, 471.78it/s]

 65%|██████▌   | 16308/25000 [00:34<00:18, 471.72it/s]

 65%|██████▌   | 16357/25000 [00:34<00:18, 471.73it/s]

 66%|██████▌   | 16405/25000 [00:34<00:18, 471.76it/s]

 66%|██████▌   | 16453/25000 [00:34<00:18, 471.75it/s]

 66%|██████▌   | 16500/25000 [00:35<00:18, 471.27it/s]

 66%|██████▌   | 16543/25000 [00:35<00:17, 471.01it/s]

 66%|██████▋   | 16585/25000 [00:35<00:17, 470.45it/s]

 67%|██████▋   | 16634/25000 [00:35<00:17, 470.47it/s]

 67%|██████▋   | 16678/25000 [00:35<00:17, 470.38it/s]

 67%|██████▋   | 16721/25000 [00:35<00:17, 470.18it/s]

 67%|██████▋   | 16767/25000 [00:35<00:17, 470.14it/s]

 67%|██████▋   | 16818/25000 [00:35<00:17, 470.22it/s]

 67%|██████▋   | 16867/25000 [00:35<00:17, 470.25it/s]

 68%|██████▊   | 16913/25000 [00:35<00:17, 469.86it/s]

 68%|██████▊   | 16956/25000 [00:36<00:17, 468.67it/s]

 68%|██████▊   | 16994/25000 [00:36<00:17, 467.64it/s]

 68%|██████▊   | 17028/25000 [00:36<00:17, 466.83it/s]

 68%|██████▊   | 17059/25000 [00:36<00:17, 466.17it/s]

 68%|██████▊   | 17091/25000 [00:36<00:16, 465.74it/s]

 68%|██████▊   | 17121/25000 [00:36<00:16, 464.98it/s]

 69%|██████▊   | 17150/25000 [00:36<00:16, 464.33it/s]

 69%|██████▉   | 17197/25000 [00:37<00:16, 464.33it/s]

 69%|██████▉   | 17231/25000 [00:37<00:16, 463.98it/s]

 69%|██████▉   | 17265/25000 [00:37<00:16, 463.30it/s]

 69%|██████▉   | 17300/25000 [00:37<00:16, 462.97it/s]

 69%|██████▉   | 17344/25000 [00:37<00:16, 462.90it/s]

 70%|██████▉   | 17395/25000 [00:37<00:16, 463.00it/s]

 70%|██████▉   | 17443/25000 [00:37<00:16, 463.02it/s]

 70%|██████▉   | 17487/25000 [00:37<00:16, 462.96it/s]

 70%|███████   | 17530/25000 [00:37<00:16, 462.87it/s]

 70%|███████   | 17573/25000 [00:37<00:16, 462.69it/s]

 70%|███████   | 17615/25000 [00:38<00:15, 462.29it/s]

 71%|███████   | 17663/25000 [00:38<00:15, 462.31it/s]

 71%|███████   | 17710/25000 [00:38<00:15, 462.32it/s]

 71%|███████   | 17757/25000 [00:38<00:15, 462.33it/s]

 71%|███████   | 17809/25000 [00:38<00:15, 462.46it/s]

 71%|███████▏  | 17856/25000 [00:38<00:15, 461.51it/s]

 72%|███████▏  | 17897/25000 [00:38<00:15, 460.76it/s]

 72%|███████▏  | 17934/25000 [00:38<00:15, 460.40it/s]

 72%|███████▏  | 17980/25000 [00:39<00:15, 460.38it/s]

 72%|███████▏  | 18027/25000 [00:39<00:15, 460.39it/s]

 72%|███████▏  | 18075/25000 [00:39<00:15, 460.43it/s]

 72%|███████▏  | 18124/25000 [00:39<00:14, 460.51it/s]

 73%|███████▎  | 18174/25000 [00:39<00:14, 460.58it/s]

 73%|███████▎  | 18221/25000 [00:39<00:14, 460.59it/s]

 73%|███████▎  | 18269/25000 [00:39<00:14, 460.62it/s]

 73%|███████▎  | 18316/25000 [00:39<00:14, 460.62it/s]

 73%|███████▎  | 18364/25000 [00:39<00:14, 460.67it/s]

 74%|███████▎  | 18411/25000 [00:39<00:14, 460.66it/s]

 74%|███████▍  | 18460/25000 [00:40<00:14, 460.72it/s]

 74%|███████▍  | 18508/25000 [00:40<00:14, 460.77it/s]

 74%|███████▍  | 18558/25000 [00:40<00:13, 460.87it/s]

 74%|███████▍  | 18607/25000 [00:40<00:13, 460.88it/s]

 75%|███████▍  | 18656/25000 [00:40<00:13, 460.94it/s]

 75%|███████▍  | 18704/25000 [00:40<00:13, 460.17it/s]

 75%|███████▍  | 18746/25000 [00:40<00:13, 459.43it/s]

 75%|███████▌  | 18784/25000 [00:40<00:13, 458.23it/s]

 75%|███████▌  | 18837/25000 [00:41<00:13, 458.40it/s]

 76%|███████▌  | 18883/25000 [00:41<00:13, 458.39it/s]

 76%|███████▌  | 18924/25000 [00:41<00:13, 457.46it/s]

 76%|███████▌  | 18960/25000 [00:41<00:13, 456.31it/s]

 76%|███████▌  | 18991/25000 [00:41<00:13, 455.83it/s]

 76%|███████▌  | 19035/25000 [00:41<00:13, 455.77it/s]

 76%|███████▋  | 19082/25000 [00:41<00:12, 455.80it/s]

 76%|███████▋  | 19120/25000 [00:41<00:12, 455.59it/s]

 77%|███████▋  | 19160/25000 [00:42<00:12, 455.45it/s]

 77%|███████▋  | 19204/25000 [00:42<00:12, 455.41it/s]

 77%|███████▋  | 19246/25000 [00:42<00:12, 455.32it/s]

 77%|███████▋  | 19290/25000 [00:42<00:12, 455.28it/s]

 77%|███████▋  | 19333/25000 [00:42<00:12, 455.21it/s]

 78%|███████▊  | 19376/25000 [00:42<00:12, 455.15it/s]

 78%|███████▊  | 19423/25000 [00:42<00:12, 455.17it/s]

 78%|███████▊  | 19467/25000 [00:42<00:12, 455.10it/s]

 78%|███████▊  | 19511/25000 [00:42<00:12, 454.78it/s]

 78%|███████▊  | 19556/25000 [00:43<00:11, 454.75it/s]

 78%|███████▊  | 19607/25000 [00:43<00:11, 454.87it/s]

 79%|███████▊  | 19656/25000 [00:43<00:11, 454.95it/s]

 79%|███████▉  | 19704/25000 [00:43<00:11, 455.00it/s]

 79%|███████▉  | 19755/25000 [00:43<00:11, 455.11it/s]

 79%|███████▉  | 19803/25000 [00:43<00:11, 455.02it/s]

 79%|███████▉  | 19854/25000 [00:43<00:11, 455.13it/s]

 80%|███████▉  | 19905/25000 [00:43<00:11, 455.25it/s]

 80%|███████▉  | 19954/25000 [00:43<00:11, 455.30it/s]

 80%|████████  | 20002/25000 [00:43<00:10, 455.30it/s]

 80%|████████  | 20050/25000 [00:44<00:10, 454.50it/s]

 80%|████████  | 20091/25000 [00:44<00:10, 453.83it/s]

 81%|████████  | 20138/25000 [00:44<00:10, 453.86it/s]

 81%|████████  | 20188/25000 [00:44<00:10, 453.96it/s]

 81%|████████  | 20231/25000 [00:44<00:10, 453.80it/s]

 81%|████████  | 20282/25000 [00:44<00:10, 453.92it/s]

 81%|████████▏ | 20327/25000 [00:44<00:10, 453.73it/s]

 82%|████████▏ | 20377/25000 [00:44<00:10, 453.83it/s]

 82%|████████▏ | 20428/25000 [00:45<00:10, 453.95it/s]

 82%|████████▏ | 20477/25000 [00:45<00:09, 454.02it/s]

 82%|████████▏ | 20526/25000 [00:45<00:09, 454.10it/s]

 82%|████████▏ | 20574/25000 [00:45<00:09, 454.08it/s]

 82%|████████▏ | 20621/25000 [00:45<00:09, 453.31it/s]

 83%|████████▎ | 20662/25000 [00:45<00:09, 452.14it/s]

 83%|████████▎ | 20708/25000 [00:45<00:09, 452.14it/s]

 83%|████████▎ | 20757/25000 [00:45<00:09, 452.21it/s]

 83%|████████▎ | 20805/25000 [00:46<00:09, 452.27it/s]

 83%|████████▎ | 20854/25000 [00:46<00:09, 452.34it/s]

 84%|████████▎ | 20908/25000 [00:46<00:09, 452.49it/s]

 84%|████████▍ | 20958/25000 [00:46<00:08, 452.59it/s]

 84%|████████▍ | 21010/25000 [00:46<00:08, 452.72it/s]

 84%|████████▍ | 21059/25000 [00:46<00:08, 452.77it/s]

 84%|████████▍ | 21108/25000 [00:46<00:08, 452.71it/s]

 85%|████████▍ | 21155/25000 [00:46<00:08, 452.02it/s]

 85%|████████▍ | 21196/25000 [00:46<00:08, 451.75it/s]

 85%|████████▍ | 21235/25000 [00:47<00:08, 451.17it/s]

 85%|████████▌ | 21271/25000 [00:47<00:08, 450.63it/s]

 85%|████████▌ | 21304/25000 [00:47<00:08, 450.27it/s]

 85%|████████▌ | 21347/25000 [00:47<00:08, 450.23it/s]

 86%|████████▌ | 21383/25000 [00:47<00:08, 450.03it/s]

 86%|████████▌ | 21419/25000 [00:47<00:07, 449.51it/s]

 86%|████████▌ | 21452/25000 [00:47<00:07, 449.06it/s]

 86%|████████▌ | 21484/25000 [00:47<00:07, 448.64it/s]

 86%|████████▌ | 21519/25000 [00:47<00:07, 448.42it/s]

 86%|████████▌ | 21558/25000 [00:48<00:07, 448.26it/s]

 86%|████████▋ | 21592/25000 [00:48<00:07, 447.55it/s]

 86%|████████▋ | 21623/25000 [00:48<00:07, 447.26it/s]

 87%|████████▋ | 21677/25000 [00:48<00:07, 447.44it/s]

 87%|████████▋ | 21722/25000 [00:48<00:07, 447.43it/s]

 87%|████████▋ | 21762/25000 [00:48<00:07, 446.75it/s]

 87%|████████▋ | 21797/25000 [00:48<00:07, 445.45it/s]

 87%|████████▋ | 21827/25000 [00:49<00:07, 444.58it/s]

 87%|████████▋ | 21853/25000 [00:49<00:07, 443.64it/s]

 88%|████████▊ | 21888/25000 [00:49<00:07, 443.44it/s]

 88%|████████▊ | 21930/25000 [00:49<00:06, 443.38it/s]

 88%|████████▊ | 21978/25000 [00:49<00:06, 443.44it/s]

 88%|████████▊ | 22026/25000 [00:49<00:06, 443.50it/s]

 88%|████████▊ | 22072/25000 [00:49<00:06, 443.52it/s]

 88%|████████▊ | 22122/25000 [00:49<00:06, 443.62it/s]

 89%|████████▊ | 22166/25000 [00:49<00:06, 443.59it/s]

 89%|████████▉ | 22218/25000 [00:50<00:06, 443.73it/s]

 89%|████████▉ | 22268/25000 [00:50<00:06, 443.84it/s]

 89%|████████▉ | 22320/25000 [00:50<00:06, 443.98it/s]

 89%|████████▉ | 22373/25000 [00:50<00:05, 444.15it/s]

 90%|████████▉ | 22423/25000 [00:50<00:05, 444.24it/s]

 90%|████████▉ | 22473/25000 [00:50<00:05, 443.94it/s]

 90%|█████████ | 22518/25000 [00:50<00:05, 443.93it/s]

 90%|█████████ | 22567/25000 [00:50<00:05, 444.02it/s]

 90%|█████████ | 22614/25000 [00:50<00:05, 444.07it/s]

 91%|█████████ | 22668/25000 [00:51<00:05, 444.25it/s]

 91%|█████████ | 22717/25000 [00:51<00:05, 444.28it/s]

 91%|█████████ | 22770/25000 [00:51<00:05, 444.42it/s]

 91%|█████████▏| 22819/25000 [00:51<00:04, 444.49it/s]

 91%|█████████▏| 22868/25000 [00:51<00:04, 443.83it/s]

 92%|█████████▏| 22910/25000 [00:51<00:04, 443.41it/s]

 92%|█████████▏| 22952/25000 [00:51<00:04, 443.36it/s]

 92%|█████████▏| 22999/25000 [00:51<00:04, 443.39it/s]

 92%|█████████▏| 23047/25000 [00:51<00:04, 443.45it/s]

 92%|█████████▏| 23096/25000 [00:52<00:04, 443.52it/s]

 93%|█████████▎| 23145/25000 [00:52<00:04, 443.61it/s]

 93%|█████████▎| 23193/25000 [00:52<00:04, 443.66it/s]

 93%|█████████▎| 23243/25000 [00:52<00:03, 443.75it/s]

 93%|█████████▎| 23292/25000 [00:52<00:03, 443.84it/s]

 93%|█████████▎| 23340/25000 [00:52<00:03, 443.39it/s]

 94%|█████████▎| 23383/25000 [00:52<00:03, 442.68it/s]

 94%|█████████▎| 23420/25000 [00:52<00:03, 442.21it/s]

 94%|█████████▍| 23454/25000 [00:53<00:03, 441.92it/s]

 94%|█████████▍| 23503/25000 [00:53<00:03, 442.00it/s]

 94%|█████████▍| 23550/25000 [00:53<00:03, 442.04it/s]

 94%|█████████▍| 23597/25000 [00:53<00:03, 442.09it/s]

 95%|█████████▍| 23644/25000 [00:53<00:03, 442.13it/s]

 95%|█████████▍| 23689/25000 [00:53<00:02, 442.13it/s]

 95%|█████████▍| 23739/25000 [00:53<00:02, 442.23it/s]

 95%|█████████▌| 23785/25000 [00:53<00:02, 442.20it/s]

 95%|█████████▌| 23830/25000 [00:53<00:02, 441.41it/s]

 95%|█████████▌| 23869/25000 [00:54<00:02, 440.98it/s]

 96%|█████████▌| 23916/25000 [00:54<00:02, 441.02it/s]

 96%|█████████▌| 23967/25000 [00:54<00:02, 441.14it/s]

 96%|█████████▌| 24019/25000 [00:54<00:02, 441.28it/s]

 96%|█████████▋| 24064/25000 [00:54<00:02, 440.87it/s]

 96%|█████████▋| 24105/25000 [00:54<00:02, 439.50it/s]

 97%|█████████▋| 24138/25000 [00:55<00:01, 438.73it/s]

 97%|█████████▋| 24167/25000 [00:55<00:01, 438.31it/s]

 97%|█████████▋| 24199/25000 [00:55<00:01, 438.09it/s]

 97%|█████████▋| 24242/25000 [00:55<00:01, 438.05it/s]

 97%|█████████▋| 24275/25000 [00:55<00:01, 437.82it/s]

 97%|█████████▋| 24325/25000 [00:55<00:01, 437.93it/s]

 97%|█████████▋| 24373/25000 [00:55<00:01, 437.99it/s]

 98%|█████████▊| 24414/25000 [00:55<00:01, 437.67it/s]

 98%|█████████▊| 24452/25000 [00:55<00:01, 436.99it/s]

 98%|█████████▊| 24502/25000 [00:56<00:01, 437.10it/s]

 98%|█████████▊| 24553/25000 [00:56<00:01, 437.23it/s]

 98%|█████████▊| 24602/25000 [00:56<00:00, 437.32it/s]

 99%|█████████▊| 24651/25000 [00:56<00:00, 437.39it/s]

 99%|█████████▉| 24697/25000 [00:56<00:00, 437.43it/s]

 99%|█████████▉| 24744/25000 [00:56<00:00, 437.48it/s]

 99%|█████████▉| 24790/25000 [00:56<00:00, 437.44it/s]

 99%|█████████▉| 24835/25000 [00:56<00:00, 437.43it/s]

100%|█████████▉| 24889/25000 [00:56<00:00, 437.61it/s]

100%|█████████▉| 24936/25000 [00:57<00:00, 437.40it/s]

100%|█████████▉| 24980/25000 [00:57<00:00, 437.34it/s]

100%|██████████| 25000/25000 [00:57<00:00, 437.14it/s]




In [17]:
test_data = create_test_data()


  0%|          | 0/12500 [00:00<?, ?it/s]

  0%|          | 17/12500 [00:00<01:14, 168.45it/s]

  0%|          | 34/12500 [00:00<01:15, 165.69it/s]

  0%|          | 45/12500 [00:00<01:48, 114.77it/s]

  0%|          | 53/12500 [00:00<02:33, 81.27it/s] 

  1%|          | 82/12500 [00:00<01:54, 108.86it/s]

  1%|          | 137/12500 [00:00<01:17, 160.05it/s]

  1%|▏         | 163/12500 [00:01<01:24, 145.48it/s]

  1%|▏         | 186/12500 [00:01<01:20, 152.16it/s]

  2%|▏         | 224/12500 [00:01<01:12, 169.37it/s]

  2%|▏         | 263/12500 [00:01<01:06, 184.70it/s]

  2%|▏         | 293/12500 [00:01<01:07, 181.58it/s]

  3%|▎         | 321/12500 [00:01<01:05, 187.12it/s]

  3%|▎         | 348/12500 [00:01<01:04, 189.70it/s]

  3%|▎         | 379/12500 [00:01<01:02, 194.47it/s]

  3%|▎         | 425/12500 [00:02<00:58, 205.86it/s]

  4%|▎         | 464/12500 [00:02<00:56, 214.09it/s]

  4%|▍         | 497/12500 [00:02<00:56, 211.32it/s]

  4%|▍         | 526/12500 [00:02<00:55, 214.01it/s]

  5%|▍         | 571/12500 [00:02<00:53, 223.01it/s]

  5%|▍         | 622/12500 [00:02<00:50, 233.76it/s]

  5%|▌         | 668/12500 [00:02<00:48, 241.82it/s]

  6%|▌         | 715/12500 [00:02<00:47, 249.68it/s]

  6%|▌         | 764/12500 [00:02<00:45, 257.78it/s]

  6%|▋         | 811/12500 [00:03<00:44, 264.54it/s]

  7%|▋         | 862/12500 [00:03<00:42, 272.17it/s]

  7%|▋         | 912/12500 [00:03<00:41, 279.01it/s]

  8%|▊         | 963/12500 [00:03<00:40, 285.76it/s]

  8%|▊         | 1012/12500 [00:03<00:39, 290.79it/s]

  8%|▊         | 1060/12500 [00:03<00:38, 295.72it/s]

  9%|▉         | 1110/12500 [00:03<00:37, 301.16it/s]

  9%|▉         | 1158/12500 [00:03<00:37, 305.84it/s]

 10%|▉         | 1209/12500 [00:03<00:36, 310.85it/s]

 10%|█         | 1258/12500 [00:04<00:35, 313.77it/s]

 10%|█         | 1304/12500 [00:04<00:35, 314.17it/s]

 11%|█         | 1346/12500 [00:04<00:35, 314.27it/s]

 11%|█         | 1395/12500 [00:04<00:34, 318.24it/s]

 12%|█▏        | 1441/12500 [00:04<00:34, 321.36it/s]

 12%|█▏        | 1490/12500 [00:04<00:33, 324.99it/s]

 12%|█▏        | 1536/12500 [00:04<00:33, 327.75it/s]

 13%|█▎        | 1587/12500 [00:04<00:32, 331.37it/s]

 13%|█▎        | 1634/12500 [00:04<00:32, 333.81it/s]

 13%|█▎        | 1686/12500 [00:04<00:32, 337.47it/s]

 14%|█▍        | 1734/12500 [00:05<00:31, 339.83it/s]

 14%|█▍        | 1783/12500 [00:05<00:31, 342.71it/s]

 15%|█▍        | 1833/12500 [00:05<00:30, 345.66it/s]

 15%|█▌        | 1883/12500 [00:05<00:30, 348.38it/s]

 15%|█▌        | 1934/12500 [00:05<00:30, 351.23it/s]

 16%|█▌        | 1983/12500 [00:05<00:29, 353.15it/s]

 16%|█▌        | 2031/12500 [00:05<00:29, 354.99it/s]

 17%|█▋        | 2079/12500 [00:05<00:29, 356.60it/s]

 17%|█▋        | 2130/12500 [00:05<00:28, 359.12it/s]

 17%|█▋        | 2178/12500 [00:06<00:28, 357.76it/s]

 18%|█▊        | 2222/12500 [00:06<00:28, 359.07it/s]

 18%|█▊        | 2272/12500 [00:06<00:28, 361.27it/s]

 19%|█▊        | 2323/12500 [00:06<00:27, 363.60it/s]

 19%|█▉        | 2376/12500 [00:06<00:27, 366.06it/s]

 19%|█▉        | 2426/12500 [00:06<00:27, 368.06it/s]

 20%|█▉        | 2478/12500 [00:06<00:27, 370.30it/s]

 20%|██        | 2528/12500 [00:06<00:26, 371.90it/s]

 21%|██        | 2577/12500 [00:06<00:26, 372.49it/s]

 21%|██        | 2624/12500 [00:07<00:26, 371.62it/s]

 21%|██▏       | 2667/12500 [00:07<00:26, 370.19it/s]

 22%|██▏       | 2731/12500 [00:07<00:26, 373.85it/s]

 22%|██▏       | 2793/12500 [00:07<00:25, 377.08it/s]

 23%|██▎       | 2854/12500 [00:07<00:25, 380.08it/s]

 23%|██▎       | 2913/12500 [00:07<00:25, 382.80it/s]

 24%|██▍       | 2971/12500 [00:07<00:24, 385.29it/s]

 24%|██▍       | 3031/12500 [00:07<00:24, 388.02it/s]

 25%|██▍       | 3091/12500 [00:07<00:24, 390.65it/s]

 25%|██▌       | 3149/12500 [00:08<00:23, 392.38it/s]

 26%|██▌       | 3205/12500 [00:08<00:23, 393.81it/s]

 26%|██▌       | 3259/12500 [00:08<00:23, 394.04it/s]

 26%|██▋       | 3312/12500 [00:08<00:23, 395.65it/s]

 27%|██▋       | 3363/12500 [00:08<00:23, 396.44it/s]

 27%|██▋       | 3416/12500 [00:08<00:22, 397.92it/s]

 28%|██▊       | 3467/12500 [00:08<00:22, 399.13it/s]

 28%|██▊       | 3518/12500 [00:08<00:22, 399.60it/s]

 29%|██▊       | 3567/12500 [00:08<00:22, 398.36it/s]

 29%|██▉       | 3611/12500 [00:09<00:22, 395.23it/s]

 29%|██▉       | 3664/12500 [00:09<00:22, 396.68it/s]

 30%|██▉       | 3712/12500 [00:09<00:22, 397.48it/s]

 30%|███       | 3756/12500 [00:09<00:22, 395.13it/s]

 30%|███       | 3795/12500 [00:09<00:22, 393.02it/s]

 31%|███       | 3845/12500 [00:09<00:21, 394.02it/s]

 31%|███       | 3884/12500 [00:09<00:21, 393.72it/s]

 31%|███▏      | 3923/12500 [00:09<00:21, 393.39it/s]

 32%|███▏      | 3975/12500 [00:10<00:21, 394.57it/s]

 32%|███▏      | 4024/12500 [00:10<00:21, 395.49it/s]

 33%|███▎      | 4075/12500 [00:10<00:21, 396.58it/s]

 33%|███▎      | 4125/12500 [00:10<00:21, 397.57it/s]

 33%|███▎      | 4173/12500 [00:10<00:20, 397.47it/s]

 34%|███▍      | 4221/12500 [00:10<00:20, 398.22it/s]

 34%|███▍      | 4272/12500 [00:10<00:20, 399.23it/s]

 35%|███▍      | 4324/12500 [00:10<00:20, 400.29it/s]

 35%|███▌      | 4375/12500 [00:10<00:20, 401.29it/s]

 35%|███▌      | 4427/12500 [00:11<00:20, 402.35it/s]

 36%|███▌      | 4479/12500 [00:11<00:19, 403.34it/s]

 36%|███▌      | 4530/12500 [00:11<00:19, 403.76it/s]

 37%|███▋      | 4579/12500 [00:11<00:19, 404.47it/s]

 37%|███▋      | 4628/12500 [00:11<00:19, 405.08it/s]

 37%|███▋      | 4677/12500 [00:11<00:19, 405.60it/s]

 38%|███▊      | 4728/12500 [00:11<00:19, 406.48it/s]

 38%|███▊      | 4779/12500 [00:11<00:18, 407.35it/s]

 39%|███▊      | 4829/12500 [00:11<00:18, 408.02it/s]

 39%|███▉      | 4882/12500 [00:11<00:18, 409.03it/s]

 39%|███▉      | 4936/12500 [00:12<00:18, 410.04it/s]

 40%|███▉      | 4990/12500 [00:12<00:18, 411.06it/s]

 40%|████      | 5045/12500 [00:12<00:18, 412.10it/s]

 41%|████      | 5098/12500 [00:12<00:17, 412.83it/s]

 41%|████      | 5151/12500 [00:12<00:17, 413.71it/s]

 42%|████▏     | 5203/12500 [00:12<00:17, 414.54it/s]

 42%|████▏     | 5255/12500 [00:12<00:17, 414.49it/s]

 42%|████▏     | 5305/12500 [00:12<00:17, 415.15it/s]

 43%|████▎     | 5358/12500 [00:12<00:17, 416.01it/s]

 43%|████▎     | 5410/12500 [00:12<00:17, 416.78it/s]

 44%|████▎     | 5461/12500 [00:13<00:16, 417.40it/s]

 44%|████▍     | 5512/12500 [00:13<00:16, 418.10it/s]

 45%|████▍     | 5563/12500 [00:13<00:16, 418.59it/s]

 45%|████▍     | 5616/12500 [00:13<00:16, 419.41it/s]

 45%|████▌     | 5667/12500 [00:13<00:16, 419.97it/s]

 46%|████▌     | 5719/12500 [00:13<00:16, 420.68it/s]

 46%|████▌     | 5771/12500 [00:13<00:15, 421.38it/s]

 47%|████▋     | 5822/12500 [00:13<00:15, 421.97it/s]

 47%|████▋     | 5875/12500 [00:13<00:15, 422.72it/s]

 47%|████▋     | 5927/12500 [00:14<00:15, 422.92it/s]

 48%|████▊     | 5977/12500 [00:14<00:15, 423.44it/s]

 48%|████▊     | 6031/12500 [00:14<00:15, 424.22it/s]

 49%|████▊     | 6082/12500 [00:14<00:15, 424.74it/s]

 49%|████▉     | 6134/12500 [00:14<00:14, 425.37it/s]

 49%|████▉     | 6187/12500 [00:14<00:14, 426.04it/s]

 50%|████▉     | 6239/12500 [00:14<00:14, 426.42it/s]

 50%|█████     | 6290/12500 [00:14<00:14, 426.97it/s]

 51%|█████     | 6342/12500 [00:14<00:14, 427.54it/s]

 51%|█████     | 6393/12500 [00:14<00:14, 428.01it/s]

 52%|█████▏    | 6444/12500 [00:15<00:14, 428.49it/s]

 52%|█████▏    | 6504/12500 [00:15<00:13, 429.62it/s]

 52%|█████▏    | 6560/12500 [00:15<00:13, 430.47it/s]

 53%|█████▎    | 6618/12500 [00:15<00:13, 431.39it/s]

 53%|█████▎    | 6675/12500 [00:15<00:13, 432.26it/s]

 54%|█████▍    | 6732/12500 [00:15<00:13, 433.14it/s]

 54%|█████▍    | 6788/12500 [00:15<00:13, 433.62it/s]

 55%|█████▍    | 6843/12500 [00:15<00:13, 433.84it/s]

 55%|█████▌    | 6895/12500 [00:15<00:12, 433.71it/s]

 56%|█████▌    | 6944/12500 [00:16<00:12, 433.84it/s]

 56%|█████▌    | 6999/12500 [00:16<00:12, 434.53it/s]

 56%|█████▋    | 7049/12500 [00:16<00:12, 434.72it/s]

 57%|█████▋    | 7100/12500 [00:16<00:12, 435.10it/s]

 57%|█████▋    | 7152/12500 [00:16<00:12, 435.62it/s]

 58%|█████▊    | 7203/12500 [00:16<00:12, 436.05it/s]

 58%|█████▊    | 7257/12500 [00:16<00:12, 436.63it/s]

 58%|█████▊    | 7309/12500 [00:16<00:11, 436.79it/s]

 59%|█████▉    | 7360/12500 [00:16<00:11, 437.22it/s]

 59%|█████▉    | 7414/12500 [00:16<00:11, 437.78it/s]

 60%|█████▉    | 7465/12500 [00:17<00:11, 438.14it/s]

 60%|██████    | 7518/12500 [00:17<00:11, 438.67it/s]

 61%|██████    | 7570/12500 [00:17<00:11, 438.98it/s]

 61%|██████    | 7621/12500 [00:17<00:11, 439.31it/s]

 61%|██████▏   | 7672/12500 [00:17<00:10, 438.93it/s]

 62%|██████▏   | 7719/12500 [00:17<00:10, 438.28it/s]

 62%|██████▏   | 7764/12500 [00:17<00:10, 438.30it/s]

 63%|██████▎   | 7816/12500 [00:17<00:10, 438.71it/s]

 63%|██████▎   | 7866/12500 [00:17<00:10, 439.02it/s]

 63%|██████▎   | 7913/12500 [00:18<00:10, 438.98it/s]

 64%|██████▎   | 7964/12500 [00:18<00:10, 439.31it/s]

 64%|██████▍   | 8014/12500 [00:18<00:10, 439.61it/s]

 65%|██████▍   | 8064/12500 [00:18<00:10, 439.92it/s]

 65%|██████▍   | 8114/12500 [00:18<00:09, 440.19it/s]

 65%|██████▌   | 8167/12500 [00:18<00:09, 440.63it/s]

 66%|██████▌   | 8220/12500 [00:18<00:09, 441.09it/s]

 66%|██████▌   | 8273/12500 [00:18<00:09, 441.54it/s]

 67%|██████▋   | 8325/12500 [00:18<00:09, 441.84it/s]

 67%|██████▋   | 8376/12500 [00:18<00:09, 442.14it/s]

 67%|██████▋   | 8427/12500 [00:19<00:09, 442.46it/s]

 68%|██████▊   | 8479/12500 [00:19<00:09, 442.86it/s]

 68%|██████▊   | 8531/12500 [00:19<00:08, 443.26it/s]

 69%|██████▊   | 8583/12500 [00:19<00:08, 443.50it/s]

 69%|██████▉   | 8634/12500 [00:19<00:08, 443.74it/s]

 70%|██████▉   | 8688/12500 [00:19<00:08, 444.19it/s]

 70%|██████▉   | 8739/12500 [00:19<00:08, 444.51it/s]

 70%|███████   | 8791/12500 [00:19<00:08, 444.88it/s]

 71%|███████   | 8843/12500 [00:19<00:08, 445.15it/s]

 71%|███████   | 8894/12500 [00:19<00:08, 445.47it/s]

 72%|███████▏  | 8948/12500 [00:20<00:07, 445.93it/s]

 72%|███████▏  | 9000/12500 [00:20<00:07, 446.14it/s]

 72%|███████▏  | 9052/12500 [00:20<00:07, 446.46it/s]

 73%|███████▎  | 9105/12500 [00:20<00:07, 446.86it/s]

 73%|███████▎  | 9157/12500 [00:20<00:07, 447.12it/s]

 74%|███████▎  | 9209/12500 [00:20<00:07, 447.44it/s]

 74%|███████▍  | 9260/12500 [00:20<00:07, 447.74it/s]

 74%|███████▍  | 9311/12500 [00:20<00:07, 447.93it/s]

 75%|███████▍  | 9363/12500 [00:20<00:06, 448.26it/s]

 75%|███████▌  | 9414/12500 [00:20<00:06, 448.50it/s]

 76%|███████▌  | 9465/12500 [00:21<00:06, 448.74it/s]

 76%|███████▌  | 9517/12500 [00:21<00:06, 449.03it/s]

 77%|███████▋  | 9569/12500 [00:21<00:06, 449.32it/s]

 77%|███████▋  | 9621/12500 [00:21<00:06, 449.63it/s]

 77%|███████▋  | 9672/12500 [00:21<00:06, 449.80it/s]

 78%|███████▊  | 9726/12500 [00:21<00:06, 450.17it/s]

 78%|███████▊  | 9777/12500 [00:21<00:06, 450.39it/s]

 79%|███████▊  | 9830/12500 [00:21<00:05, 450.70it/s]

 79%|███████▉  | 9881/12500 [00:21<00:05, 450.97it/s]

 79%|███████▉  | 9934/12500 [00:22<00:05, 451.29it/s]

 80%|███████▉  | 9986/12500 [00:22<00:05, 451.52it/s]

 80%|████████  | 10037/12500 [00:22<00:05, 451.69it/s]

 81%|████████  | 10088/12500 [00:22<00:05, 451.87it/s]

 81%|████████  | 10147/12500 [00:22<00:05, 452.47it/s]

 82%|████████▏ | 10203/12500 [00:22<00:05, 452.91it/s]

 82%|████████▏ | 10264/12500 [00:22<00:04, 453.57it/s]

 83%|████████▎ | 10321/12500 [00:22<00:04, 454.06it/s]

 83%|████████▎ | 10377/12500 [00:22<00:04, 454.43it/s]

 83%|████████▎ | 10433/12500 [00:22<00:04, 454.89it/s]

 84%|████████▍ | 10489/12500 [00:23<00:04, 455.15it/s]

 84%|████████▍ | 10543/12500 [00:23<00:04, 455.34it/s]

 85%|████████▍ | 10596/12500 [00:23<00:04, 455.55it/s]

 85%|████████▌ | 10651/12500 [00:23<00:04, 455.93it/s]

 86%|████████▌ | 10704/12500 [00:23<00:03, 456.11it/s]

 86%|████████▌ | 10756/12500 [00:23<00:03, 456.21it/s]

 86%|████████▋ | 10807/12500 [00:23<00:03, 455.87it/s]

 87%|████████▋ | 10859/12500 [00:23<00:03, 456.13it/s]

 87%|████████▋ | 10909/12500 [00:23<00:03, 456.31it/s]

 88%|████████▊ | 10958/12500 [00:24<00:03, 455.83it/s]

 88%|████████▊ | 11011/12500 [00:24<00:03, 456.13it/s]

 89%|████████▊ | 11063/12500 [00:24<00:03, 456.38it/s]

 89%|████████▉ | 11115/12500 [00:24<00:03, 456.64it/s]

 89%|████████▉ | 11165/12500 [00:24<00:02, 456.33it/s]

 90%|████████▉ | 11220/12500 [00:24<00:02, 456.69it/s]

 90%|█████████ | 11273/12500 [00:24<00:02, 456.96it/s]

 91%|█████████ | 11323/12500 [00:24<00:02, 457.00it/s]

 91%|█████████ | 11376/12500 [00:24<00:02, 457.27it/s]

 91%|█████████▏| 11427/12500 [00:24<00:02, 457.45it/s]

 92%|█████████▏| 11479/12500 [00:25<00:02, 457.68it/s]

 92%|█████████▏| 11530/12500 [00:25<00:02, 457.87it/s]

 93%|█████████▎| 11581/12500 [00:25<00:02, 458.03it/s]

 93%|█████████▎| 11632/12500 [00:25<00:01, 458.15it/s]

 93%|█████████▎| 11683/12500 [00:25<00:01, 458.33it/s]

 94%|█████████▍| 11734/12500 [00:25<00:01, 458.51it/s]

 94%|█████████▍| 11785/12500 [00:25<00:01, 458.68it/s]

 95%|█████████▍| 11836/12500 [00:25<00:01, 458.83it/s]

 95%|█████████▌| 11886/12500 [00:25<00:01, 458.95it/s]

 95%|█████████▌| 11936/12500 [00:25<00:01, 459.09it/s]

 96%|█████████▌| 11989/12500 [00:26<00:01, 459.35it/s]

 96%|█████████▋| 12040/12500 [00:26<00:01, 459.50it/s]

 97%|█████████▋| 12091/12500 [00:26<00:00, 459.66it/s]

 97%|█████████▋| 12142/12500 [00:26<00:00, 459.78it/s]

 98%|█████████▊| 12193/12500 [00:26<00:00, 459.95it/s]

 98%|█████████▊| 12245/12500 [00:26<00:00, 460.14it/s]

 98%|█████████▊| 12296/12500 [00:26<00:00, 460.30it/s]

 99%|█████████▉| 12349/12500 [00:26<00:00, 460.55it/s]

 99%|█████████▉| 12400/12500 [00:26<00:00, 460.71it/s]

100%|█████████▉| 12451/12500 [00:27<00:00, 460.82it/s]

100%|██████████| 12500/12500 [00:27<00:00, 460.96it/s]




In [18]:
train_len = len(train_data)
print(train_len)

25000

In [19]:
train = train_data[:-500]
test = train_data[-500:]

In [20]:
X_train = np.array([i[0] for i in train]).reshape(-1, IMG_SIZE, IMG_SIZE, 1)
Y_train = [i[1] for i in train]

X_test = np.array([i[0] for i in test]).reshape(-1, IMG_SIZE, IMG_SIZE, 1)
Y_test = [i[1] for i in test]


In [23]:
 ## Build the model
tf.reset_default_graph()

convnet = input_data(shape=[None, IMG_SIZE, IMG_SIZE, 1], name='input')

convnet = conv_2d(convnet, 32, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 64, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 64, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = fully_connected(convnet, 1024, activation='relu')
convnet = dropout(convnet, 0.8)

convnet = fully_connected(convnet, 2, activation='softmax')
convnet = regression(convnet, optimizer='adam', learning_rate=LR, loss='categorical_crossentropy', name='targets')

model = tflearn.DNN(convnet, tensorboard_dir='log')

In [107]:
model.fit({'input': X_train}, {'targets': Y_train}, n_epoch=5, 
          validation_set=({'input': X_test}, {'targets': Y_test}), 
          snapshot_step=500, show_metric=True, run_id=MODEL_NAME)

model.save(MODEL_NAME)

---------------------------------




Run id: dogs-vs-cats-4-layer-covnet




Log directory: log/




INFO:tensorflow:Summary name Accuracy/ (raw) is illegal; using Accuracy/__raw_ instead.




---------------------------------




Training samples: 24500




Validation samples: 500




--




Training Step: 1  | time: 0.372s


| Adam | epoch: 001 | loss: 0.00000 - acc: 0.0000 -- iter: 00064/24500


Training Step: 2  | total loss: 

1.31031

 | time: 0.593s


| Adam | epoch: 001 | loss: 1.31031 - acc: 0.5062 -- iter: 00128/24500


Training Step: 3  | total loss: 

8.80860

 | time: 0.825s


| Adam | epoch: 001 | loss: 8.80860 - acc: 0.5267 -- iter: 00192/24500


Training Step: 4  | total loss: 

7.94305

 | time: 1.052s


| Adam | epoch: 001 | loss: 7.94305 - acc: 0.4481 -- iter: 00256/24500


Training Step: 5  | total loss: 

2.95845

 | time: 1.282s


| Adam | epoch: 001 | loss: 2.95845 - acc: 0.5706 -- iter: 00320/24500


Training Step: 6  | total loss: 

1.51136

 | time: 1.507s


| Adam | epoch: 001 | loss: 1.51136 - acc: 0.5754 -- iter: 00384/24500


Training Step: 7  | total loss: 

1.83074

 | time: 1.744s


| Adam | epoch: 001 | loss: 1.83074 - acc: 0.5302 -- iter: 00448/24500


Training Step: 8  | total loss: 

1.38827

 | time: 1.985s


| Adam | epoch: 001 | loss: 1.38827 - acc: 0.5659 -- iter: 00512/24500


Training Step: 9  | total loss: 

1.04489

 | time: 2.216s


| Adam | epoch: 001 | loss: 1.04489 - acc: 0.6055 -- iter: 00576/24500


Training Step: 10  | total loss: 

0.92804

 | time: 2.460s


| Adam | epoch: 001 | loss: 0.92804 - acc: 0.5918 -- iter: 00640/24500


Training Step: 11  | total loss: 

0.82058

 | time: 2.697s


| Adam | epoch: 001 | loss: 0.82058 - acc: 0.5705 -- iter: 00704/24500


Training Step: 12  | total loss: 

0.75649

 | time: 2.930s


| Adam | epoch: 001 | loss: 0.75649 - acc: 0.5458 -- iter: 00768/24500


Training Step: 13  | total loss: 

0.74409

 | time: 3.170s


| Adam | epoch: 001 | loss: 0.74409 - acc: 0.5329 -- iter: 00832/24500


Training Step: 14  | total loss: 

0.71983

 | time: 3.400s


| Adam | epoch: 001 | loss: 0.71983 - acc: 0.5130 -- iter: 00896/24500


Training Step: 15  | total loss: 

0.71630

 | time: 3.648s


| Adam | epoch: 001 | loss: 0.71630 - acc: 0.5263 -- iter: 00960/24500


Training Step: 16  | total loss: 

0.74532

 | time: 3.875s


| Adam | epoch: 001 | loss: 0.74532 - acc: 0.4813 -- iter: 01024/24500


Training Step: 17  | total loss: 

0.72995

 | time: 4.113s


| Adam | epoch: 001 | loss: 0.72995 - acc: 0.5049 -- iter: 01088/24500


Training Step: 18  | total loss: 

0.72255

 | time: 4.340s


| Adam | epoch: 001 | loss: 0.72255 - acc: 0.5032 -- iter: 01152/24500


Training Step: 19  | total loss: 

0.71808

 | time: 4.572s


| Adam | epoch: 001 | loss: 0.71808 - acc: 0.5230 -- iter: 01216/24500


Training Step: 20  | total loss: 

0.72130

 | time: 4.802s


| Adam | epoch: 001 | loss: 0.72130 - acc: 0.5256 -- iter: 01280/24500


Training Step: 21  | total loss: 

0.73009

 | time: 5.040s


| Adam | epoch: 001 | loss: 0.73009 - acc: 0.5225 -- iter: 01344/24500


Training Step: 22  | total loss: 

0.73447

 | time: 5.279s


| Adam | epoch: 001 | loss: 0.73447 - acc: 0.4830 -- iter: 01408/24500


Training Step: 23  | total loss: 

0.71838

 | time: 5.519s


| Adam | epoch: 001 | loss: 0.71838 - acc: 0.5060 -- iter: 01472/24500


Training Step: 24  | total loss: 

0.76165

 | time: 5.745s


| Adam | epoch: 001 | loss: 0.76165 - acc: 0.4868 -- iter: 01536/24500


Training Step: 25  | total loss: 

0.73507

 | time: 5.967s


| Adam | epoch: 001 | loss: 0.73507 - acc: 0.4946 -- iter: 01600/24500


Training Step: 26  | total loss: 

0.72138

 | time: 6.180s


| Adam | epoch: 001 | loss: 0.72138 - acc: 0.5250 -- iter: 01664/24500


Training Step: 27  | total loss: 

0.71270

 | time: 6.393s


| Adam | epoch: 001 | loss: 0.71270 - acc: 0.5347 -- iter: 01728/24500


Training Step: 28  | total loss: 

0.71289

 | time: 6.614s


| Adam | epoch: 001 | loss: 0.71289 - acc: 0.5260 -- iter: 01792/24500


Training Step: 29  | total loss: 

0.68851

 | time: 6.831s


| Adam | epoch: 001 | loss: 0.68851 - acc: 0.5881 -- iter: 01856/24500


Training Step: 30  | total loss: 

0.68864

 | time: 7.045s


| Adam | epoch: 001 | loss: 0.68864 - acc: 0.5746 -- iter: 01920/24500


Training Step: 31  | total loss: 

0.68726

 | time: 7.263s


| Adam | epoch: 001 | loss: 0.68726 - acc: 0.5682 -- iter: 01984/24500


Training Step: 32  | total loss: 

0.69245

 | time: 7.478s


| Adam | epoch: 001 | loss: 0.69245 - acc: 0.5634 -- iter: 02048/24500


Training Step: 33  | total loss: 

0.68624

 | time: 7.694s


| Adam | epoch: 001 | loss: 0.68624 - acc: 0.5701 -- iter: 02112/24500


Training Step: 34  | total loss: 

0.69182

 | time: 7.915s


| Adam | epoch: 001 | loss: 0.69182 - acc: 0.5651 -- iter: 02176/24500


Training Step: 35  | total loss: 

0.69280

 | time: 8.136s


| Adam | epoch: 001 | loss: 0.69280 - acc: 0.5547 -- iter: 02240/24500


Training Step: 36  | total loss: 

0.68921

 | time: 8.349s


| Adam | epoch: 001 | loss: 0.68921 - acc: 0.5563 -- iter: 02304/24500


Training Step: 37  | total loss: 

0.68949

 | time: 8.570s


| Adam | epoch: 001 | loss: 0.68949 - acc: 0.5607 -- iter: 02368/24500


Training Step: 38  | total loss: 

0.68631

 | time: 8.796s


| Adam | epoch: 001 | loss: 0.68631 - acc: 0.5672 -- iter: 02432/24500


Training Step: 39  | total loss: 

0.70175

 | time: 9.014s


| Adam | epoch: 001 | loss: 0.70175 - acc: 0.5423 -- iter: 02496/24500


Training Step: 40  | total loss: 

0.69607

 | time: 9.236s


| Adam | epoch: 001 | loss: 0.69607 - acc: 0.5549 -- iter: 02560/24500


Training Step: 41  | total loss: 

0.69861

 | time: 9.466s


| Adam | epoch: 001 | loss: 0.69861 - acc: 0.5592 -- iter: 02624/24500


Training Step: 42  | total loss: 

0.69445

 | time: 9.689s


| Adam | epoch: 001 | loss: 0.69445 - acc: 0.5682 -- iter: 02688/24500


Training Step: 43  | total loss: 

0.69761

 | time: 9.902s


| Adam | epoch: 001 | loss: 0.69761 - acc: 0.5672 -- iter: 02752/24500


Training Step: 44  | total loss: 

0.68584

 | time: 10.115s


| Adam | epoch: 001 | loss: 0.68584 - acc: 0.5745 -- iter: 02816/24500


Training Step: 45  | total loss: 

0.68246

 | time: 10.328s


| Adam | epoch: 001 | loss: 0.68246 - acc: 0.5804 -- iter: 02880/24500


Training Step: 46  | total loss: 

0.67400

 | time: 10.544s


| Adam | epoch: 001 | loss: 0.67400 - acc: 0.5852 -- iter: 02944/24500


Training Step: 47  | total loss: 

0.68061

 | time: 10.756s


| Adam | epoch: 001 | loss: 0.68061 - acc: 0.5790 -- iter: 03008/24500


Training Step: 48  | total loss: 

0.68752

 | time: 10.978s


| Adam | epoch: 001 | loss: 0.68752 - acc: 0.5688 -- iter: 03072/24500


Training Step: 49  | total loss: 

0.68860

 | time: 11.192s


| Adam | epoch: 001 | loss: 0.68860 - acc: 0.5653 -- iter: 03136/24500


Training Step: 50  | total loss: 

0.68074

 | time: 11.410s


| Adam | epoch: 001 | loss: 0.68074 - acc: 0.5867 -- iter: 03200/24500


Training Step: 51  | total loss: 

0.67980

 | time: 11.629s


| Adam | epoch: 001 | loss: 0.67980 - acc: 0.5830 -- iter: 03264/24500


Training Step: 52  | total loss: 

0.67610

 | time: 11.849s


| Adam | epoch: 001 | loss: 0.67610 - acc: 0.5823 -- iter: 03328/24500


Training Step: 53  | total loss: 

0.67560

 | time: 12.066s


| Adam | epoch: 001 | loss: 0.67560 - acc: 0.5840 -- iter: 03392/24500


Training Step: 54  | total loss: 

0.67947

 | time: 12.278s


| Adam | epoch: 001 | loss: 0.67947 - acc: 0.5763 -- iter: 03456/24500


Training Step: 55  | total loss: 

0.67613

 | time: 12.499s


| Adam | epoch: 001 | loss: 0.67613 - acc: 0.5900 -- iter: 03520/24500


Training Step: 56  | total loss: 

0.67914

 | time: 12.724s


| Adam | epoch: 001 | loss: 0.67914 - acc: 0.5795 -- iter: 03584/24500


Training Step: 57  | total loss: 

0.68291

 | time: 12.937s


| Adam | epoch: 001 | loss: 0.68291 - acc: 0.5663 -- iter: 03648/24500


Training Step: 58  | total loss: 

0.68328

 | time: 13.153s


| Adam | epoch: 001 | loss: 0.68328 - acc: 0.5701 -- iter: 03712/24500


Training Step: 59  | total loss: 

0.67801

 | time: 13.367s


| Adam | epoch: 001 | loss: 0.67801 - acc: 0.5796 -- iter: 03776/24500


Training Step: 60  | total loss: 

0.67612

 | time: 13.593s


| Adam | epoch: 001 | loss: 0.67612 - acc: 0.5856 -- iter: 03840/24500


Training Step: 61  | total loss: 

0.68831

 | time: 13.818s


| Adam | epoch: 001 | loss: 0.68831 - acc: 0.5703 -- iter: 03904/24500


Training Step: 62  | total loss: 

0.69763

 | time: 14.034s


| Adam | epoch: 001 | loss: 0.69763 - acc: 0.5553 -- iter: 03968/24500


Training Step: 63  | total loss: 

0.70026

 | time: 14.253s


| Adam | epoch: 001 | loss: 0.70026 - acc: 0.5483 -- iter: 04032/24500


Training Step: 64  | total loss: 

0.69039

 | time: 14.468s


| Adam | epoch: 001 | loss: 0.69039 - acc: 0.5637 -- iter: 04096/24500


Training Step: 65  | total loss: 

0.69255

 | time: 14.681s


| Adam | epoch: 001 | loss: 0.69255 - acc: 0.5578 -- iter: 04160/24500


Training Step: 66  | total loss: 

0.68839

 | time: 14.904s


| Adam | epoch: 001 | loss: 0.68839 - acc: 0.5660 -- iter: 04224/24500


Training Step: 67  | total loss: 

0.68756

 | time: 15.125s


| Adam | epoch: 001 | loss: 0.68756 - acc: 0.5712 -- iter: 04288/24500


Training Step: 68  | total loss: 

0.68360

 | time: 15.344s


| Adam | epoch: 001 | loss: 0.68360 - acc: 0.5775 -- iter: 04352/24500


Training Step: 69  | total loss: 

0.69523

 | time: 15.564s


| Adam | epoch: 001 | loss: 0.69523 - acc: 0.5612 -- iter: 04416/24500


Training Step: 70  | total loss: 

0.69518

 | time: 15.783s


| Adam | epoch: 001 | loss: 0.69518 - acc: 0.5595 -- iter: 04480/24500


Training Step: 71  | total loss: 

0.69134

 | time: 16.003s


| Adam | epoch: 001 | loss: 0.69134 - acc: 0.5599 -- iter: 04544/24500


Training Step: 72  | total loss: 

0.69553

 | time: 16.225s


| Adam | epoch: 001 | loss: 0.69553 - acc: 0.5602 -- iter: 04608/24500


Training Step: 73  | total loss: 

0.70213

 | time: 16.444s


| Adam | epoch: 001 | loss: 0.70213 - acc: 0.5535 -- iter: 04672/24500


Training Step: 74  | total loss: 

0.70248

 | time: 16.663s


| Adam | epoch: 001 | loss: 0.70248 - acc: 0.5459 -- iter: 04736/24500


Training Step: 75  | total loss: 

0.69684

 | time: 16.889s


| Adam | epoch: 001 | loss: 0.69684 - acc: 0.5528 -- iter: 04800/24500


Training Step: 76  | total loss: 

0.69428

 | time: 17.108s


| Adam | epoch: 001 | loss: 0.69428 - acc: 0.5488 -- iter: 04864/24500


Training Step: 77  | total loss: 

0.69236

 | time: 17.331s


| Adam | epoch: 001 | loss: 0.69236 - acc: 0.5536 -- iter: 04928/24500


Training Step: 78  | total loss: 

0.69141

 | time: 17.548s


| Adam | epoch: 001 | loss: 0.69141 - acc: 0.5545 -- iter: 04992/24500


Training Step: 79  | total loss: 

0.69423

 | time: 17.766s


| Adam | epoch: 001 | loss: 0.69423 - acc: 0.5505 -- iter: 05056/24500


Training Step: 80  | total loss: 

0.69354

 | time: 17.989s


| Adam | epoch: 001 | loss: 0.69354 - acc: 0.5437 -- iter: 05120/24500


Training Step: 81  | total loss: 

0.69128

 | time: 18.219s


| Adam | epoch: 001 | loss: 0.69128 - acc: 0.5535 -- iter: 05184/24500


Training Step: 82  | total loss: 

0.69194

 | time: 18.434s


| Adam | epoch: 001 | loss: 0.69194 - acc: 0.5497 -- iter: 05248/24500


Training Step: 83  | total loss: 

0.69024

 | time: 18.654s


| Adam | epoch: 001 | loss: 0.69024 - acc: 0.5651 -- iter: 05312/24500


Training Step: 84  | total loss: 

0.68939

 | time: 18.875s


| Adam | epoch: 001 | loss: 0.68939 - acc: 0.5742 -- iter: 05376/24500


Training Step: 85  | total loss: 

0.68736

 | time: 19.097s


| Adam | epoch: 001 | loss: 0.68736 - acc: 0.5746 -- iter: 05440/24500


Training Step: 86  | total loss: 

0.68697

 | time: 19.315s


| Adam | epoch: 001 | loss: 0.68697 - acc: 0.5781 -- iter: 05504/24500


Training Step: 87  | total loss: 

0.68212

 | time: 19.538s


| Adam | epoch: 001 | loss: 0.68212 - acc: 0.5874 -- iter: 05568/24500


Training Step: 88  | total loss: 

0.67949

 | time: 19.751s


| Adam | epoch: 001 | loss: 0.67949 - acc: 0.5943 -- iter: 05632/24500


Training Step: 89  | total loss: 

0.68328

 | time: 19.972s


| Adam | epoch: 001 | loss: 0.68328 - acc: 0.5943 -- iter: 05696/24500


Training Step: 90  | total loss: 

0.67925

 | time: 20.190s


| Adam | epoch: 001 | loss: 0.67925 - acc: 0.5989 -- iter: 05760/24500


Training Step: 91  | total loss: 

0.67884

 | time: 20.406s


| Adam | epoch: 001 | loss: 0.67884 - acc: 0.5953 -- iter: 05824/24500


Training Step: 92  | total loss: 

0.67587

 | time: 20.625s


| Adam | epoch: 001 | loss: 0.67587 - acc: 0.5951 -- iter: 05888/24500


Training Step: 93  | total loss: 

0.68049

 | time: 20.842s


| Adam | epoch: 001 | loss: 0.68049 - acc: 0.5872 -- iter: 05952/24500


Training Step: 94  | total loss: 

0.67289

 | time: 21.067s


| Adam | epoch: 001 | loss: 0.67289 - acc: 0.6003 -- iter: 06016/24500


Training Step: 95  | total loss: 

0.66948

 | time: 21.282s


| Adam | epoch: 001 | loss: 0.66948 - acc: 0.6043 -- iter: 06080/24500


Training Step: 96  | total loss: 

0.67391

 | time: 21.506s


| Adam | epoch: 001 | loss: 0.67391 - acc: 0.5986 -- iter: 06144/24500


Training Step: 97  | total loss: 

0.67502

 | time: 21.728s


| Adam | epoch: 001 | loss: 0.67502 - acc: 0.5934 -- iter: 06208/24500


Training Step: 98  | total loss: 

0.67410

 | time: 21.944s


| Adam | epoch: 001 | loss: 0.67410 - acc: 0.5950 -- iter: 06272/24500


Training Step: 99  | total loss: 

0.68267

 | time: 22.162s


| Adam | epoch: 001 | loss: 0.68267 - acc: 0.5855 -- iter: 06336/24500


Training Step: 100  | total loss: 

0.67921

 | time: 22.385s


| Adam | epoch: 001 | loss: 0.67921 - acc: 0.5926 -- iter: 06400/24500


Training Step: 101  | total loss: 

0.67501

 | time: 22.611s


| Adam | epoch: 001 | loss: 0.67501 - acc: 0.5958 -- iter: 06464/24500


Training Step: 102  | total loss: 

0.67902

 | time: 22.827s


| Adam | epoch: 001 | loss: 0.67902 - acc: 0.5925 -- iter: 06528/24500


Training Step: 103  | total loss: 

0.67103

 | time: 23.049s


| Adam | epoch: 001 | loss: 0.67103 - acc: 0.6083 -- iter: 06592/24500


Training Step: 104  | total loss: 

0.66799

 | time: 23.267s


| Adam | epoch: 001 | loss: 0.66799 - acc: 0.6021 -- iter: 06656/24500


Training Step: 105  | total loss: 

0.66446

 | time: 23.486s


| Adam | epoch: 001 | loss: 0.66446 - acc: 0.6138 -- iter: 06720/24500


Training Step: 106  | total loss: 

0.66938

 | time: 23.707s


| Adam | epoch: 001 | loss: 0.66938 - acc: 0.5993 -- iter: 06784/24500


Training Step: 107  | total loss: 

0.67415

 | time: 23.930s


| Adam | epoch: 001 | loss: 0.67415 - acc: 0.5893 -- iter: 06848/24500


Training Step: 108  | total loss: 

0.67419

 | time: 24.153s


| Adam | epoch: 001 | loss: 0.67419 - acc: 0.5867 -- iter: 06912/24500


Training Step: 109  | total loss: 

0.67280

 | time: 24.378s


| Adam | epoch: 001 | loss: 0.67280 - acc: 0.5889 -- iter: 06976/24500


Training Step: 110  | total loss: 

0.67209

 | time: 24.599s


| Adam | epoch: 001 | loss: 0.67209 - acc: 0.5894 -- iter: 07040/24500


Training Step: 111  | total loss: 

0.66790

 | time: 24.819s


| Adam | epoch: 001 | loss: 0.66790 - acc: 0.5977 -- iter: 07104/24500


Training Step: 112  | total loss: 

0.66518

 | time: 25.039s


| Adam | epoch: 001 | loss: 0.66518 - acc: 0.6035 -- iter: 07168/24500


Training Step: 113  | total loss: 

0.66284

 | time: 25.258s


| Adam | epoch: 001 | loss: 0.66284 - acc: 0.6025 -- iter: 07232/24500


Training Step: 114  | total loss: 

0.66265

 | time: 25.483s


| Adam | epoch: 001 | loss: 0.66265 - acc: 0.6001 -- iter: 07296/24500


Training Step: 115  | total loss: 

0.66389

 | time: 25.704s


| Adam | epoch: 001 | loss: 0.66389 - acc: 0.5995 -- iter: 07360/24500


Training Step: 116  | total loss: 

0.67105

 | time: 25.928s


| Adam | epoch: 001 | loss: 0.67105 - acc: 0.5926 -- iter: 07424/24500


Training Step: 117  | total loss: 

0.66132

 | time: 26.165s


| Adam | epoch: 001 | loss: 0.66132 - acc: 0.6084 -- iter: 07488/24500


Training Step: 118  | total loss: 

0.65543

 | time: 26.386s


| Adam | epoch: 001 | loss: 0.65543 - acc: 0.6147 -- iter: 07552/24500


Training Step: 119  | total loss: 

0.65423

 | time: 26.606s


| Adam | epoch: 001 | loss: 0.65423 - acc: 0.6189 -- iter: 07616/24500


Training Step: 120  | total loss: 

0.64600

 | time: 26.827s


| Adam | epoch: 001 | loss: 0.64600 - acc: 0.6242 -- iter: 07680/24500


Training Step: 121  | total loss: 

0.64874

 | time: 27.048s


| Adam | epoch: 001 | loss: 0.64874 - acc: 0.6305 -- iter: 07744/24500


Training Step: 122  | total loss: 

0.64933

 | time: 27.270s


| Adam | epoch: 001 | loss: 0.64933 - acc: 0.6284 -- iter: 07808/24500


Training Step: 123  | total loss: 

0.64708

 | time: 27.496s


| Adam | epoch: 001 | loss: 0.64708 - acc: 0.6281 -- iter: 07872/24500


Training Step: 124  | total loss: 

0.64738

 | time: 27.707s


| Adam | epoch: 001 | loss: 0.64738 - acc: 0.6340 -- iter: 07936/24500


Training Step: 125  | total loss: 

0.64790

 | time: 27.927s


| Adam | epoch: 001 | loss: 0.64790 - acc: 0.6300 -- iter: 08000/24500


Training Step: 126  | total loss: 

0.65421

 | time: 28.152s


| Adam | epoch: 001 | loss: 0.65421 - acc: 0.6232 -- iter: 08064/24500


Training Step: 127  | total loss: 

0.65469

 | time: 28.385s


| Adam | epoch: 001 | loss: 0.65469 - acc: 0.6281 -- iter: 08128/24500


Training Step: 128  | total loss: 

0.66726

 | time: 28.604s


| Adam | epoch: 001 | loss: 0.66726 - acc: 0.6184 -- iter: 08192/24500


Training Step: 129  | total loss: 

0.66738

 | time: 28.826s


| Adam | epoch: 001 | loss: 0.66738 - acc: 0.6175 -- iter: 08256/24500


Training Step: 130  | total loss: 

0.66887

 | time: 29.051s


| Adam | epoch: 001 | loss: 0.66887 - acc: 0.6120 -- iter: 08320/24500


Training Step: 131  | total loss: 

0.66917

 | time: 29.281s


| Adam | epoch: 001 | loss: 0.66917 - acc: 0.6086 -- iter: 08384/24500


Training Step: 132  | total loss: 

0.66831

 | time: 29.514s


| Adam | epoch: 001 | loss: 0.66831 - acc: 0.6056 -- iter: 08448/24500


Training Step: 133  | total loss: 

0.66953

 | time: 29.739s


| Adam | epoch: 001 | loss: 0.66953 - acc: 0.6044 -- iter: 08512/24500


Training Step: 134  | total loss: 

0.67343

 | time: 29.966s


| Adam | epoch: 001 | loss: 0.67343 - acc: 0.5971 -- iter: 08576/24500


Training Step: 135  | total loss: 

0.66873

 | time: 30.192s


| Adam | epoch: 001 | loss: 0.66873 - acc: 0.5967 -- iter: 08640/24500


Training Step: 136  | total loss: 

0.66875

 | time: 30.451s


| Adam | epoch: 001 | loss: 0.66875 - acc: 0.5964 -- iter: 08704/24500


Training Step: 137  | total loss: 

0.66641

 | time: 30.701s


| Adam | epoch: 001 | loss: 0.66641 - acc: 0.5977 -- iter: 08768/24500


Training Step: 138  | total loss: 

0.66325

 | time: 30.970s


| Adam | epoch: 001 | loss: 0.66325 - acc: 0.5973 -- iter: 08832/24500


Training Step: 139  | total loss: 

0.65453

 | time: 31.216s


| Adam | epoch: 001 | loss: 0.65453 - acc: 0.6173 -- iter: 08896/24500


Training Step: 140  | total loss: 

0.65505

 | time: 31.453s


| Adam | epoch: 001 | loss: 0.65505 - acc: 0.6118 -- iter: 08960/24500


Training Step: 141  | total loss: 

0.65698

 | time: 31.756s


| Adam | epoch: 001 | loss: 0.65698 - acc: 0.6084 -- iter: 09024/24500


Training Step: 142  | total loss: 

0.65821

 | time: 31.988s


| Adam | epoch: 001 | loss: 0.65821 - acc: 0.6101 -- iter: 09088/24500


Training Step: 143  | total loss: 

0.64790

 | time: 32.265s


| Adam | epoch: 001 | loss: 0.64790 - acc: 0.6194 -- iter: 09152/24500


Training Step: 144  | total loss: 

0.65575

 | time: 32.524s


| Adam | epoch: 001 | loss: 0.65575 - acc: 0.6153 -- iter: 09216/24500


Training Step: 145  | total loss: 

0.64803

 | time: 32.767s


| Adam | epoch: 001 | loss: 0.64803 - acc: 0.6256 -- iter: 09280/24500


Training Step: 146  | total loss: 

0.64518

 | time: 32.997s


| Adam | epoch: 001 | loss: 0.64518 - acc: 0.6334 -- iter: 09344/24500


Training Step: 147  | total loss: 

0.64575

 | time: 33.283s


| Adam | epoch: 001 | loss: 0.64575 - acc: 0.6341 -- iter: 09408/24500


Training Step: 148  | total loss: 

0.64100

 | time: 33.564s


| Adam | epoch: 001 | loss: 0.64100 - acc: 0.6410 -- iter: 09472/24500


Training Step: 149  | total loss: 

0.63933

 | time: 33.804s


| Adam | epoch: 001 | loss: 0.63933 - acc: 0.6347 -- iter: 09536/24500


Training Step: 150  | total loss: 

0.62706

 | time: 34.042s


| Adam | epoch: 001 | loss: 0.62706 - acc: 0.6509 -- iter: 09600/24500


Training Step: 151  | total loss: 

0.62454

 | time: 34.289s


| Adam | epoch: 001 | loss: 0.62454 - acc: 0.6577 -- iter: 09664/24500


Training Step: 152  | total loss: 

0.61733

 | time: 34.524s


| Adam | epoch: 001 | loss: 0.61733 - acc: 0.6638 -- iter: 09728/24500


Training Step: 153  | total loss: 

0.63474

 | time: 34.829s


| Adam | epoch: 001 | loss: 0.63474 - acc: 0.6537 -- iter: 09792/24500


Training Step: 154  | total loss: 

0.64331

 | time: 35.068s


| Adam | epoch: 001 | loss: 0.64331 - acc: 0.6430 -- iter: 09856/24500


Training Step: 155  | total loss: 

0.64189

 | time: 35.312s


| Adam | epoch: 001 | loss: 0.64189 - acc: 0.6459 -- iter: 09920/24500


Training Step: 156  | total loss: 

0.64618

 | time: 35.586s


| Adam | epoch: 001 | loss: 0.64618 - acc: 0.6391 -- iter: 09984/24500


Training Step: 157  | total loss: 

0.64025

 | time: 35.860s


| Adam | epoch: 001 | loss: 0.64025 - acc: 0.6455 -- iter: 10048/24500


Training Step: 158  | total loss: 

0.62571

 | time: 36.132s


| Adam | epoch: 001 | loss: 0.62571 - acc: 0.6653 -- iter: 10112/24500


Training Step: 159  | total loss: 

0.63200

 | time: 36.416s


| Adam | epoch: 001 | loss: 0.63200 - acc: 0.6613 -- iter: 10176/24500


Training Step: 160  | total loss: 

0.62945

 | time: 36.692s


| Adam | epoch: 001 | loss: 0.62945 - acc: 0.6592 -- iter: 10240/24500


Training Step: 161  | total loss: 

0.63498

 | time: 36.976s


| Adam | epoch: 001 | loss: 0.63498 - acc: 0.6543 -- iter: 10304/24500


Training Step: 162  | total loss: 

0.63662

 | time: 37.261s


| Adam | epoch: 001 | loss: 0.63662 - acc: 0.6576 -- iter: 10368/24500


Training Step: 163  | total loss: 

0.63300

 | time: 37.550s


| Adam | epoch: 001 | loss: 0.63300 - acc: 0.6621 -- iter: 10432/24500


Training Step: 164  | total loss: 

0.62750

 | time: 37.836s


| Adam | epoch: 001 | loss: 0.62750 - acc: 0.6725 -- iter: 10496/24500


Training Step: 165  | total loss: 

0.62520

 | time: 38.111s


| Adam | epoch: 001 | loss: 0.62520 - acc: 0.6771 -- iter: 10560/24500


Training Step: 166  | total loss: 

0.62481

 | time: 38.395s


| Adam | epoch: 001 | loss: 0.62481 - acc: 0.6735 -- iter: 10624/24500


Training Step: 167  | total loss: 

0.63094

 | time: 38.637s


| Adam | epoch: 001 | loss: 0.63094 - acc: 0.6686 -- iter: 10688/24500


Training Step: 168  | total loss: 

0.63335

 | time: 38.870s


| Adam | epoch: 001 | loss: 0.63335 - acc: 0.6596 -- iter: 10752/24500


Training Step: 169  | total loss: 

0.63844

 | time: 39.122s


| Adam | epoch: 001 | loss: 0.63844 - acc: 0.6592 -- iter: 10816/24500


Training Step: 170  | total loss: 

0.63192

 | time: 39.397s


| Adam | epoch: 001 | loss: 0.63192 - acc: 0.6589 -- iter: 10880/24500


Training Step: 171  | total loss: 

0.63058

 | time: 39.684s


| Adam | epoch: 001 | loss: 0.63058 - acc: 0.6555 -- iter: 10944/24500


Training Step: 172  | total loss: 

0.63241

 | time: 39.967s


| Adam | epoch: 001 | loss: 0.63241 - acc: 0.6462 -- iter: 11008/24500


Training Step: 173  | total loss: 

0.63492

 | time: 40.217s


| Adam | epoch: 001 | loss: 0.63492 - acc: 0.6426 -- iter: 11072/24500


Training Step: 174  | total loss: 

0.64272

 | time: 40.547s


| Adam | epoch: 001 | loss: 0.64272 - acc: 0.6314 -- iter: 11136/24500


Training Step: 175  | total loss: 

0.64087

 | time: 40.917s


| Adam | epoch: 001 | loss: 0.64087 - acc: 0.6355 -- iter: 11200/24500


Training Step: 176  | total loss: 

0.64277

 | time: 41.279s


| Adam | epoch: 001 | loss: 0.64277 - acc: 0.6375 -- iter: 11264/24500


Training Step: 177  | total loss: 

0.65082

 | time: 41.679s


| Adam | epoch: 001 | loss: 0.65082 - acc: 0.6300 -- iter: 11328/24500


Training Step: 178  | total loss: 

0.64924

 | time: 42.033s


| Adam | epoch: 001 | loss: 0.64924 - acc: 0.6358 -- iter: 11392/24500


Training Step: 179  | total loss: 

0.65038

 | time: 42.425s


| Adam | epoch: 001 | loss: 0.65038 - acc: 0.6300 -- iter: 11456/24500


Training Step: 180  | total loss: 

0.65093

 | time: 42.800s


| Adam | epoch: 001 | loss: 0.65093 - acc: 0.6217 -- iter: 11520/24500


Training Step: 181  | total loss: 

0.65202

 | time: 43.202s


| Adam | epoch: 001 | loss: 0.65202 - acc: 0.6205 -- iter: 11584/24500


Training Step: 182  | total loss: 

0.64766

 | time: 43.551s


| Adam | epoch: 001 | loss: 0.64766 - acc: 0.6319 -- iter: 11648/24500


Training Step: 183  | total loss: 

0.65298

 | time: 43.917s


| Adam | epoch: 001 | loss: 0.65298 - acc: 0.6265 -- iter: 11712/24500


Training Step: 184  | total loss: 

0.64654

 | time: 44.282s


| Adam | epoch: 001 | loss: 0.64654 - acc: 0.6326 -- iter: 11776/24500


Training Step: 185  | total loss: 

0.64655

 | time: 44.658s


| Adam | epoch: 001 | loss: 0.64655 - acc: 0.6334 -- iter: 11840/24500


Training Step: 186  | total loss: 

0.64585

 | time: 45.016s


| Adam | epoch: 001 | loss: 0.64585 - acc: 0.6372 -- iter: 11904/24500


Training Step: 187  | total loss: 

0.65137

 | time: 45.374s


| Adam | epoch: 001 | loss: 0.65137 - acc: 0.6329 -- iter: 11968/24500


Training Step: 188  | total loss: 

0.65304

 | time: 45.732s


| Adam | epoch: 001 | loss: 0.65304 - acc: 0.6321 -- iter: 12032/24500


Training Step: 189  | total loss: 

0.64952

 | time: 46.071s


| Adam | epoch: 001 | loss: 0.64952 - acc: 0.6376 -- iter: 12096/24500


Training Step: 190  | total loss: 

0.64917

 | time: 46.422s


| Adam | epoch: 001 | loss: 0.64917 - acc: 0.6395 -- iter: 12160/24500


Training Step: 191  | total loss: 

0.65098

 | time: 46.760s


| Adam | epoch: 001 | loss: 0.65098 - acc: 0.6381 -- iter: 12224/24500


Training Step: 192  | total loss: 

0.65478

 | time: 47.115s


| Adam | epoch: 001 | loss: 0.65478 - acc: 0.6305 -- iter: 12288/24500


Training Step: 193  | total loss: 

0.65674

 | time: 47.476s


| Adam | epoch: 001 | loss: 0.65674 - acc: 0.6268 -- iter: 12352/24500


Training Step: 194  | total loss: 

0.65056

 | time: 47.820s


| Adam | epoch: 001 | loss: 0.65056 - acc: 0.6345 -- iter: 12416/24500


Training Step: 195  | total loss: 

0.64823

 | time: 48.157s


| Adam | epoch: 001 | loss: 0.64823 - acc: 0.6366 -- iter: 12480/24500


Training Step: 196  | total loss: 

0.64599

 | time: 48.508s


| Adam | epoch: 001 | loss: 0.64599 - acc: 0.6402 -- iter: 12544/24500


Training Step: 197  | total loss: 

0.64186

 | time: 48.858s


| Adam | epoch: 001 | loss: 0.64186 - acc: 0.6449 -- iter: 12608/24500


Training Step: 198  | total loss: 

0.63720

 | time: 49.203s


| Adam | epoch: 001 | loss: 0.63720 - acc: 0.6507 -- iter: 12672/24500


Training Step: 199  | total loss: 

0.63599

 | time: 49.551s


| Adam | epoch: 001 | loss: 0.63599 - acc: 0.6497 -- iter: 12736/24500


Training Step: 200  | total loss: 

0.63868

 | time: 49.892s


| Adam | epoch: 001 | loss: 0.63868 - acc: 0.6410 -- iter: 12800/24500


Training Step: 201  | total loss: 

0.63746

 | time: 50.242s


| Adam | epoch: 001 | loss: 0.63746 - acc: 0.6456 -- iter: 12864/24500


Training Step: 202  | total loss: 

0.63322

 | time: 50.577s


| Adam | epoch: 001 | loss: 0.63322 - acc: 0.6529 -- iter: 12928/24500


Training Step: 203  | total loss: 

0.63417

 | time: 50.939s


| Adam | epoch: 001 | loss: 0.63417 - acc: 0.6470 -- iter: 12992/24500


Training Step: 204  | total loss: 

0.62959

 | time: 51.265s


| Adam | epoch: 001 | loss: 0.62959 - acc: 0.6558 -- iter: 13056/24500


Training Step: 205  | total loss: 

0.63399

 | time: 51.603s


| Adam | epoch: 001 | loss: 0.63399 - acc: 0.6496 -- iter: 13120/24500


Training Step: 206  | total loss: 

0.63735

 | time: 51.948s


| Adam | epoch: 001 | loss: 0.63735 - acc: 0.6440 -- iter: 13184/24500


Training Step: 207  | total loss: 

0.63980

 | time: 52.271s


| Adam | epoch: 001 | loss: 0.63980 - acc: 0.6327 -- iter: 13248/24500


Training Step: 208  | total loss: 

0.63619

 | time: 52.610s


| Adam | epoch: 001 | loss: 0.63619 - acc: 0.6382 -- iter: 13312/24500


Training Step: 209  | total loss: 

0.62793

 | time: 52.955s


| Adam | epoch: 001 | loss: 0.62793 - acc: 0.6416 -- iter: 13376/24500


Training Step: 210  | total loss: 

0.62570

 | time: 53.301s


| Adam | epoch: 001 | loss: 0.62570 - acc: 0.6399 -- iter: 13440/24500


Training Step: 211  | total loss: 

0.62463

 | time: 53.642s


| Adam | epoch: 001 | loss: 0.62463 - acc: 0.6384 -- iter: 13504/24500


Training Step: 212  | total loss: 

0.63367

 | time: 53.991s


| Adam | epoch: 001 | loss: 0.63367 - acc: 0.6371 -- iter: 13568/24500


Training Step: 213  | total loss: 

0.63140

 | time: 54.347s


| Adam | epoch: 001 | loss: 0.63140 - acc: 0.6374 -- iter: 13632/24500


Training Step: 214  | total loss: 

0.62942

 | time: 54.703s


| Adam | epoch: 001 | loss: 0.62942 - acc: 0.6362 -- iter: 13696/24500


Training Step: 215  | total loss: 

0.63081

 | time: 55.071s


| Adam | epoch: 001 | loss: 0.63081 - acc: 0.6366 -- iter: 13760/24500


Training Step: 216  | total loss: 

0.62923

 | time: 55.437s


| Adam | epoch: 001 | loss: 0.62923 - acc: 0.6417 -- iter: 13824/24500


Training Step: 217  | total loss: 

0.62639

 | time: 55.792s


| Adam | epoch: 001 | loss: 0.62639 - acc: 0.6447 -- iter: 13888/24500


Training Step: 218  | total loss: 

0.62815

 | time: 56.153s


| Adam | epoch: 001 | loss: 0.62815 - acc: 0.6443 -- iter: 13952/24500


Training Step: 219  | total loss: 

0.62793

 | time: 56.534s


| Adam | epoch: 001 | loss: 0.62793 - acc: 0.6455 -- iter: 14016/24500


Training Step: 220  | total loss: 

0.63028

 | time: 56.901s


| Adam | epoch: 001 | loss: 0.63028 - acc: 0.6419 -- iter: 14080/24500


Training Step: 221  | total loss: 

0.62638

 | time: 57.249s


| Adam | epoch: 001 | loss: 0.62638 - acc: 0.6433 -- iter: 14144/24500


Training Step: 222  | total loss: 

0.61986

 | time: 57.613s


| Adam | epoch: 001 | loss: 0.61986 - acc: 0.6509 -- iter: 14208/24500


Training Step: 223  | total loss: 

0.62270

 | time: 57.982s


| Adam | epoch: 001 | loss: 0.62270 - acc: 0.6436 -- iter: 14272/24500


Training Step: 224  | total loss: 

0.62216

 | time: 58.355s


| Adam | epoch: 001 | loss: 0.62216 - acc: 0.6417 -- iter: 14336/24500


Training Step: 225  | total loss: 

0.62257

 | time: 58.731s


| Adam | epoch: 001 | loss: 0.62257 - acc: 0.6369 -- iter: 14400/24500


Training Step: 226  | total loss: 

0.62148

 | time: 59.074s


| Adam | epoch: 001 | loss: 0.62148 - acc: 0.6420 -- iter: 14464/24500


Training Step: 227  | total loss: 

0.61796

 | time: 59.441s


| Adam | epoch: 001 | loss: 0.61796 - acc: 0.6403 -- iter: 14528/24500


Training Step: 228  | total loss: 

0.62778

 | time: 59.792s


| Adam | epoch: 001 | loss: 0.62778 - acc: 0.6325 -- iter: 14592/24500


Training Step: 229  | total loss: 

0.62507

 | time: 60.157s


| Adam | epoch: 001 | loss: 0.62507 - acc: 0.6380 -- iter: 14656/24500


Training Step: 230  | total loss: 

0.63426

 | time: 60.527s


| Adam | epoch: 001 | loss: 0.63426 - acc: 0.6352 -- iter: 14720/24500


Training Step: 231  | total loss: 

0.63247

 | time: 60.886s


| Adam | epoch: 001 | loss: 0.63247 - acc: 0.6373 -- iter: 14784/24500


Training Step: 232  | total loss: 

0.63291

 | time: 61.233s


| Adam | epoch: 001 | loss: 0.63291 - acc: 0.6392 -- iter: 14848/24500


Training Step: 233  | total loss: 

0.61960

 | time: 61.586s


| Adam | epoch: 001 | loss: 0.61960 - acc: 0.6518 -- iter: 14912/24500


Training Step: 234  | total loss: 

0.61303

 | time: 61.937s


| Adam | epoch: 001 | loss: 0.61303 - acc: 0.6538 -- iter: 14976/24500


Training Step: 235  | total loss: 

0.61061

 | time: 62.290s


| Adam | epoch: 001 | loss: 0.61061 - acc: 0.6619 -- iter: 15040/24500


Training Step: 236  | total loss: 

0.61284

 | time: 62.650s


| Adam | epoch: 001 | loss: 0.61284 - acc: 0.6566 -- iter: 15104/24500


Training Step: 237  | total loss: 

0.60754

 | time: 63.005s


| Adam | epoch: 001 | loss: 0.60754 - acc: 0.6581 -- iter: 15168/24500


Training Step: 238  | total loss: 

0.61747

 | time: 63.367s


| Adam | epoch: 001 | loss: 0.61747 - acc: 0.6501 -- iter: 15232/24500


Training Step: 239  | total loss: 

0.61228

 | time: 63.742s


| Adam | epoch: 001 | loss: 0.61228 - acc: 0.6508 -- iter: 15296/24500


Training Step: 240  | total loss: 

0.62076

 | time: 64.109s


| Adam | epoch: 001 | loss: 0.62076 - acc: 0.6466 -- iter: 15360/24500


Training Step: 241  | total loss: 

0.61597

 | time: 64.493s


| Adam | epoch: 001 | loss: 0.61597 - acc: 0.6476 -- iter: 15424/24500


Training Step: 242  | total loss: 

0.62417

 | time: 64.852s


| Adam | epoch: 001 | loss: 0.62417 - acc: 0.6406 -- iter: 15488/24500


Training Step: 243  | total loss: 

0.62017

 | time: 65.228s


| Adam | epoch: 001 | loss: 0.62017 - acc: 0.6422 -- iter: 15552/24500


Training Step: 244  | total loss: 

0.61497

 | time: 65.603s


| Adam | epoch: 001 | loss: 0.61497 - acc: 0.6514 -- iter: 15616/24500


Training Step: 245  | total loss: 

0.60319

 | time: 65.973s


| Adam | epoch: 001 | loss: 0.60319 - acc: 0.6613 -- iter: 15680/24500


Training Step: 246  | total loss: 

0.60507

 | time: 66.347s


| Adam | epoch: 001 | loss: 0.60507 - acc: 0.6561 -- iter: 15744/24500


Training Step: 247  | total loss: 

0.60807

 | time: 66.721s


| Adam | epoch: 001 | loss: 0.60807 - acc: 0.6530 -- iter: 15808/24500


Training Step: 248  | total loss: 

0.60591

 | time: 67.107s


| Adam | epoch: 001 | loss: 0.60591 - acc: 0.6596 -- iter: 15872/24500


Training Step: 249  | total loss: 

0.60747

 | time: 67.470s


| Adam | epoch: 001 | loss: 0.60747 - acc: 0.6592 -- iter: 15936/24500


Training Step: 250  | total loss: 

0.60529

 | time: 67.849s


| Adam | epoch: 001 | loss: 0.60529 - acc: 0.6589 -- iter: 16000/24500


Training Step: 251  | total loss: 

0.60592

 | time: 68.212s


| Adam | epoch: 001 | loss: 0.60592 - acc: 0.6618 -- iter: 16064/24500


Training Step: 252  | total loss: 

0.60702

 | time: 68.595s


| Adam | epoch: 001 | loss: 0.60702 - acc: 0.6659 -- iter: 16128/24500


Training Step: 253  | total loss: 

0.60955

 | time: 68.958s


| Adam | epoch: 001 | loss: 0.60955 - acc: 0.6556 -- iter: 16192/24500


Training Step: 254  | total loss: 

0.61159

 | time: 69.324s


| Adam | epoch: 001 | loss: 0.61159 - acc: 0.6572 -- iter: 16256/24500


Training Step: 255  | total loss: 

0.60931

 | time: 69.698s


| Adam | epoch: 001 | loss: 0.60931 - acc: 0.6680 -- iter: 16320/24500


Training Step: 256  | total loss: 

0.60364

 | time: 70.072s


| Adam | epoch: 001 | loss: 0.60364 - acc: 0.6747 -- iter: 16384/24500


Training Step: 257  | total loss: 

0.60159

 | time: 70.443s


| Adam | epoch: 001 | loss: 0.60159 - acc: 0.6728 -- iter: 16448/24500


Training Step: 258  | total loss: 

0.61067

 | time: 70.827s


| Adam | epoch: 001 | loss: 0.61067 - acc: 0.6649 -- iter: 16512/24500


Training Step: 259  | total loss: 

0.61274

 | time: 71.197s


| Adam | epoch: 001 | loss: 0.61274 - acc: 0.6656 -- iter: 16576/24500


Training Step: 260  | total loss: 

0.60726

 | time: 71.564s


| Adam | epoch: 001 | loss: 0.60726 - acc: 0.6741 -- iter: 16640/24500


Training Step: 261  | total loss: 

0.61603

 | time: 71.949s


| Adam | epoch: 001 | loss: 0.61603 - acc: 0.6738 -- iter: 16704/24500


Training Step: 262  | total loss: 

0.61915

 | time: 72.330s


| Adam | epoch: 001 | loss: 0.61915 - acc: 0.6658 -- iter: 16768/24500


Training Step: 263  | total loss: 

0.61349

 | time: 72.716s


| Adam | epoch: 001 | loss: 0.61349 - acc: 0.6727 -- iter: 16832/24500


Training Step: 264  | total loss: 

0.61418

 | time: 73.075s


| Adam | epoch: 001 | loss: 0.61418 - acc: 0.6742 -- iter: 16896/24500


Training Step: 265  | total loss: 

0.61463

 | time: 73.459s


| Adam | epoch: 001 | loss: 0.61463 - acc: 0.6708 -- iter: 16960/24500


Training Step: 266  | total loss: 

0.61569

 | time: 73.836s


| Adam | epoch: 001 | loss: 0.61569 - acc: 0.6709 -- iter: 17024/24500


Training Step: 267  | total loss: 

0.61941

 | time: 74.238s


| Adam | epoch: 001 | loss: 0.61941 - acc: 0.6663 -- iter: 17088/24500


Training Step: 268  | total loss: 

0.62513

 | time: 74.604s


| Adam | epoch: 001 | loss: 0.62513 - acc: 0.6606 -- iter: 17152/24500


Training Step: 269  | total loss: 

0.62303

 | time: 74.985s


| Adam | epoch: 001 | loss: 0.62303 - acc: 0.6618 -- iter: 17216/24500


Training Step: 270  | total loss: 

0.62304

 | time: 75.359s


| Adam | epoch: 001 | loss: 0.62304 - acc: 0.6581 -- iter: 17280/24500


Training Step: 271  | total loss: 

0.62398

 | time: 75.719s


| Adam | epoch: 001 | loss: 0.62398 - acc: 0.6579 -- iter: 17344/24500


Training Step: 272  | total loss: 

0.61968

 | time: 76.099s


| Adam | epoch: 001 | loss: 0.61968 - acc: 0.6546 -- iter: 17408/24500


Training Step: 273  | total loss: 

0.62016

 | time: 76.465s


| Adam | epoch: 001 | loss: 0.62016 - acc: 0.6579 -- iter: 17472/24500


Training Step: 274  | total loss: 

0.61425

 | time: 76.851s


| Adam | epoch: 001 | loss: 0.61425 - acc: 0.6624 -- iter: 17536/24500


Training Step: 275  | total loss: 

0.61249

 | time: 77.233s


| Adam | epoch: 001 | loss: 0.61249 - acc: 0.6649 -- iter: 17600/24500


Training Step: 276  | total loss: 

0.61295

 | time: 77.615s


| Adam | epoch: 001 | loss: 0.61295 - acc: 0.6687 -- iter: 17664/24500


Training Step: 277  | total loss: 

0.61250

 | time: 78.009s


| Adam | epoch: 001 | loss: 0.61250 - acc: 0.6659 -- iter: 17728/24500


Training Step: 278  | total loss: 

0.61575

 | time: 78.395s


| Adam | epoch: 001 | loss: 0.61575 - acc: 0.6634 -- iter: 17792/24500


Training Step: 279  | total loss: 

0.61140

 | time: 78.780s


| Adam | epoch: 001 | loss: 0.61140 - acc: 0.6658 -- iter: 17856/24500


Training Step: 280  | total loss: 

0.61785

 | time: 79.136s


| Adam | epoch: 001 | loss: 0.61785 - acc: 0.6586 -- iter: 17920/24500


Training Step: 281  | total loss: 

0.61451

 | time: 79.523s


| Adam | epoch: 001 | loss: 0.61451 - acc: 0.6662 -- iter: 17984/24500


Training Step: 282  | total loss: 

0.60677

 | time: 79.920s


| Adam | epoch: 001 | loss: 0.60677 - acc: 0.6730 -- iter: 18048/24500


Training Step: 283  | total loss: 

0.62240

 | time: 80.297s


| Adam | epoch: 001 | loss: 0.62240 - acc: 0.6651 -- iter: 18112/24500


Training Step: 284  | total loss: 

0.61961

 | time: 80.661s


| Adam | epoch: 001 | loss: 0.61961 - acc: 0.6689 -- iter: 18176/24500


Training Step: 285  | total loss: 

0.61938

 | time: 81.045s


| Adam | epoch: 001 | loss: 0.61938 - acc: 0.6676 -- iter: 18240/24500


Training Step: 286  | total loss: 

0.61988

 | time: 81.438s


| Adam | epoch: 001 | loss: 0.61988 - acc: 0.6680 -- iter: 18304/24500


Training Step: 287  | total loss: 

0.61254

 | time: 81.807s


| Adam | epoch: 001 | loss: 0.61254 - acc: 0.6731 -- iter: 18368/24500


Training Step: 288  | total loss: 

0.60383

 | time: 82.179s


| Adam | epoch: 001 | loss: 0.60383 - acc: 0.6746 -- iter: 18432/24500


Training Step: 289  | total loss: 

0.60436

 | time: 82.532s


| Adam | epoch: 001 | loss: 0.60436 - acc: 0.6743 -- iter: 18496/24500


Training Step: 290  | total loss: 

0.59566

 | time: 82.869s


| Adam | epoch: 001 | loss: 0.59566 - acc: 0.6787 -- iter: 18560/24500


Training Step: 291  | total loss: 

0.59143

 | time: 83.217s


| Adam | epoch: 001 | loss: 0.59143 - acc: 0.6765 -- iter: 18624/24500


Training Step: 292  | total loss: 

0.58562

 | time: 83.596s


| Adam | epoch: 001 | loss: 0.58562 - acc: 0.6885 -- iter: 18688/24500


Training Step: 293  | total loss: 

0.58534

 | time: 83.978s


| Adam | epoch: 001 | loss: 0.58534 - acc: 0.6853 -- iter: 18752/24500


Training Step: 294  | total loss: 

0.58325

 | time: 84.381s


| Adam | epoch: 001 | loss: 0.58325 - acc: 0.6902 -- iter: 18816/24500


Training Step: 295  | total loss: 

0.59313

 | time: 84.760s


| Adam | epoch: 001 | loss: 0.59313 - acc: 0.6868 -- iter: 18880/24500


Training Step: 296  | total loss: 

0.59850

 | time: 85.159s


| Adam | epoch: 001 | loss: 0.59850 - acc: 0.6884 -- iter: 18944/24500


Training Step: 297  | total loss: 

0.59689

 | time: 85.535s


| Adam | epoch: 001 | loss: 0.59689 - acc: 0.6883 -- iter: 19008/24500


Training Step: 298  | total loss: 

0.58680

 | time: 85.910s


| Adam | epoch: 001 | loss: 0.58680 - acc: 0.6898 -- iter: 19072/24500


Training Step: 299  | total loss: 

0.60086

 | time: 86.310s


| Adam | epoch: 001 | loss: 0.60086 - acc: 0.6833 -- iter: 19136/24500


Training Step: 300  | total loss: 

0.60822

 | time: 86.671s


| Adam | epoch: 001 | loss: 0.60822 - acc: 0.6759 -- iter: 19200/24500


Training Step: 301  | total loss: 

0.60225

 | time: 87.060s


| Adam | epoch: 001 | loss: 0.60225 - acc: 0.6818 -- iter: 19264/24500


Training Step: 302  | total loss: 

0.59652

 | time: 87.438s


| Adam | epoch: 001 | loss: 0.59652 - acc: 0.6902 -- iter: 19328/24500


Training Step: 303  | total loss: 

0.59554

 | time: 87.818s


| Adam | epoch: 001 | loss: 0.59554 - acc: 0.6899 -- iter: 19392/24500


Training Step: 304  | total loss: 

0.59905

 | time: 88.202s


| Adam | epoch: 001 | loss: 0.59905 - acc: 0.6834 -- iter: 19456/24500


Training Step: 305  | total loss: 

0.59635

 | time: 88.569s


| Adam | epoch: 001 | loss: 0.59635 - acc: 0.6838 -- iter: 19520/24500


Training Step: 306  | total loss: 

0.59437

 | time: 88.951s


| Adam | epoch: 001 | loss: 0.59437 - acc: 0.6858 -- iter: 19584/24500


Training Step: 307  | total loss: 

0.59243

 | time: 89.342s


| Adam | epoch: 001 | loss: 0.59243 - acc: 0.6828 -- iter: 19648/24500


Training Step: 308  | total loss: 

0.58364

 | time: 89.717s


| Adam | epoch: 001 | loss: 0.58364 - acc: 0.6911 -- iter: 19712/24500


Training Step: 309  | total loss: 

0.58128

 | time: 90.096s


| Adam | epoch: 001 | loss: 0.58128 - acc: 0.6892 -- iter: 19776/24500


Training Step: 310  | total loss: 

0.59022

 | time: 90.464s


| Adam | epoch: 001 | loss: 0.59022 - acc: 0.6796 -- iter: 19840/24500


Training Step: 311  | total loss: 

0.58777

 | time: 90.849s


| Adam | epoch: 001 | loss: 0.58777 - acc: 0.6820 -- iter: 19904/24500


Training Step: 312  | total loss: 

0.58150

 | time: 91.244s


| Adam | epoch: 001 | loss: 0.58150 - acc: 0.6810 -- iter: 19968/24500


Training Step: 313  | total loss: 

0.58694

 | time: 91.628s


| Adam | epoch: 001 | loss: 0.58694 - acc: 0.6832 -- iter: 20032/24500


Training Step: 314  | total loss: 

0.58418

 | time: 92.027s


| Adam | epoch: 001 | loss: 0.58418 - acc: 0.6789 -- iter: 20096/24500


Training Step: 315  | total loss: 

0.58654

 | time: 92.390s


| Adam | epoch: 001 | loss: 0.58654 - acc: 0.6751 -- iter: 20160/24500


Training Step: 316  | total loss: 

0.58910

 | time: 92.757s


| Adam | epoch: 001 | loss: 0.58910 - acc: 0.6795 -- iter: 20224/24500


Training Step: 317  | total loss: 

0.58820

 | time: 93.138s


| Adam | epoch: 001 | loss: 0.58820 - acc: 0.6850 -- iter: 20288/24500


Training Step: 318  | total loss: 

0.58570

 | time: 93.508s


| Adam | epoch: 001 | loss: 0.58570 - acc: 0.6930 -- iter: 20352/24500


Training Step: 319  | total loss: 

0.58285

 | time: 93.907s


| Adam | epoch: 001 | loss: 0.58285 - acc: 0.6972 -- iter: 20416/24500


Training Step: 320  | total loss: 

0.59195

 | time: 94.300s


| Adam | epoch: 001 | loss: 0.59195 - acc: 0.6978 -- iter: 20480/24500


Training Step: 321  | total loss: 

0.58686

 | time: 94.697s


| Adam | epoch: 001 | loss: 0.58686 - acc: 0.6952 -- iter: 20544/24500


Training Step: 322  | total loss: 

0.59195

 | time: 95.080s


| Adam | epoch: 001 | loss: 0.59195 - acc: 0.6944 -- iter: 20608/24500


Training Step: 323  | total loss: 

0.58938

 | time: 95.463s


| Adam | epoch: 001 | loss: 0.58938 - acc: 0.6968 -- iter: 20672/24500


Training Step: 324  | total loss: 

0.58929

 | time: 95.846s


| Adam | epoch: 001 | loss: 0.58929 - acc: 0.7021 -- iter: 20736/24500


Training Step: 325  | total loss: 

0.58826

 | time: 96.244s


| Adam | epoch: 001 | loss: 0.58826 - acc: 0.7007 -- iter: 20800/24500


Training Step: 326  | total loss: 

0.58153

 | time: 96.625s


| Adam | epoch: 001 | loss: 0.58153 - acc: 0.7009 -- iter: 20864/24500


Training Step: 327  | total loss: 

0.58112

 | time: 97.008s


| Adam | epoch: 001 | loss: 0.58112 - acc: 0.7027 -- iter: 20928/24500


Training Step: 328  | total loss: 

0.59443

 | time: 97.386s


| Adam | epoch: 001 | loss: 0.59443 - acc: 0.6996 -- iter: 20992/24500


Training Step: 329  | total loss: 

0.60105

 | time: 97.770s


| Adam | epoch: 001 | loss: 0.60105 - acc: 0.6844 -- iter: 21056/24500


Training Step: 330  | total loss: 

0.60112

 | time: 98.170s


| Adam | epoch: 001 | loss: 0.60112 - acc: 0.6800 -- iter: 21120/24500


Training Step: 331  | total loss: 

0.60707

 | time: 98.569s


| Adam | epoch: 001 | loss: 0.60707 - acc: 0.6714 -- iter: 21184/24500


Training Step: 332  | total loss: 

0.60102

 | time: 98.949s


| Adam | epoch: 001 | loss: 0.60102 - acc: 0.6761 -- iter: 21248/24500


Training Step: 333  | total loss: 

0.59890

 | time: 99.350s


| Adam | epoch: 001 | loss: 0.59890 - acc: 0.6819 -- iter: 21312/24500


Training Step: 334  | total loss: 

0.60142

 | time: 99.733s


| Adam | epoch: 001 | loss: 0.60142 - acc: 0.6762 -- iter: 21376/24500


Training Step: 335  | total loss: 

0.59611

 | time: 100.117s


| Adam | epoch: 001 | loss: 0.59611 - acc: 0.6789 -- iter: 21440/24500


Training Step: 336  | total loss: 

0.59446

 | time: 100.510s


| Adam | epoch: 001 | loss: 0.59446 - acc: 0.6735 -- iter: 21504/24500


Training Step: 337  | total loss: 

0.59540

 | time: 100.917s


| Adam | epoch: 001 | loss: 0.59540 - acc: 0.6796 -- iter: 21568/24500


Training Step: 338  | total loss: 

0.59244

 | time: 101.296s


| Adam | epoch: 001 | loss: 0.59244 - acc: 0.6820 -- iter: 21632/24500


Training Step: 339  | total loss: 

0.59212

 | time: 101.680s


| Adam | epoch: 001 | loss: 0.59212 - acc: 0.6872 -- iter: 21696/24500


Training Step: 340  | total loss: 

0.59038

 | time: 102.052s


| Adam | epoch: 001 | loss: 0.59038 - acc: 0.6904 -- iter: 21760/24500


Training Step: 341  | total loss: 

0.58866

 | time: 102.451s


| Adam | epoch: 001 | loss: 0.58866 - acc: 0.6901 -- iter: 21824/24500


Training Step: 342  | total loss: 

0.58897

 | time: 102.832s


| Adam | epoch: 001 | loss: 0.58897 - acc: 0.6914 -- iter: 21888/24500


Training Step: 343  | total loss: 

0.59152

 | time: 103.215s


| Adam | epoch: 001 | loss: 0.59152 - acc: 0.6894 -- iter: 21952/24500


Training Step: 344  | total loss: 

0.58379

 | time: 103.597s


| Adam | epoch: 001 | loss: 0.58379 - acc: 0.6939 -- iter: 22016/24500


Training Step: 345  | total loss: 

0.59822

 | time: 103.998s


| Adam | epoch: 001 | loss: 0.59822 - acc: 0.6808 -- iter: 22080/24500


Training Step: 346  | total loss: 

0.60080

 | time: 104.392s


| Adam | epoch: 001 | loss: 0.60080 - acc: 0.6799 -- iter: 22144/24500


Training Step: 347  | total loss: 

0.58954

 | time: 104.761s


| Adam | epoch: 001 | loss: 0.58954 - acc: 0.6853 -- iter: 22208/24500


Training Step: 348  | total loss: 

0.59505

 | time: 105.153s


| Adam | epoch: 001 | loss: 0.59505 - acc: 0.6840 -- iter: 22272/24500


Training Step: 349  | total loss: 

0.59362

 | time: 105.538s


| Adam | epoch: 001 | loss: 0.59362 - acc: 0.6859 -- iter: 22336/24500


Training Step: 350  | total loss: 

0.58532

 | time: 105.937s


| Adam | epoch: 001 | loss: 0.58532 - acc: 0.6939 -- iter: 22400/24500


Training Step: 351  | total loss: 

0.57651

 | time: 106.322s


| Adam | epoch: 001 | loss: 0.57651 - acc: 0.7026 -- iter: 22464/24500


Training Step: 352  | total loss: 

0.59846

 | time: 106.688s


| Adam | epoch: 001 | loss: 0.59846 - acc: 0.6855 -- iter: 22528/24500


Training Step: 353  | total loss: 

0.59030

 | time: 107.058s


| Adam | epoch: 001 | loss: 0.59030 - acc: 0.6872 -- iter: 22592/24500


Training Step: 354  | total loss: 

0.58586

 | time: 107.456s


| Adam | epoch: 001 | loss: 0.58586 - acc: 0.6888 -- iter: 22656/24500


Training Step: 355  | total loss: 

0.59220

 | time: 107.857s


| Adam | epoch: 001 | loss: 0.59220 - acc: 0.6840 -- iter: 22720/24500


Training Step: 356  | total loss: 

0.58054

 | time: 108.239s


| Adam | epoch: 001 | loss: 0.58054 - acc: 0.6906 -- iter: 22784/24500


Training Step: 357  | total loss: 

0.58558

 | time: 108.618s


| Adam | epoch: 001 | loss: 0.58558 - acc: 0.6872 -- iter: 22848/24500


Training Step: 358  | total loss: 

0.58952

 | time: 109.033s


| Adam | epoch: 001 | loss: 0.58952 - acc: 0.6888 -- iter: 22912/24500


Training Step: 359  | total loss: 

0.59172

 | time: 109.416s


| Adam | epoch: 001 | loss: 0.59172 - acc: 0.6855 -- iter: 22976/24500


Training Step: 360  | total loss: 

0.59826

 | time: 109.800s


| Adam | epoch: 001 | loss: 0.59826 - acc: 0.6810 -- iter: 23040/24500


Training Step: 361  | total loss: 

0.59590

 | time: 110.175s


| Adam | epoch: 001 | loss: 0.59590 - acc: 0.6817 -- iter: 23104/24500


Training Step: 362  | total loss: 

0.59522

 | time: 110.561s


| Adam | epoch: 001 | loss: 0.59522 - acc: 0.6854 -- iter: 23168/24500


Training Step: 363  | total loss: 

0.58773

 | time: 110.960s


| Adam | epoch: 001 | loss: 0.58773 - acc: 0.6903 -- iter: 23232/24500


Training Step: 364  | total loss: 

0.58282

 | time: 111.318s


| Adam | epoch: 001 | loss: 0.58282 - acc: 0.6963 -- iter: 23296/24500


Training Step: 365  | total loss: 

0.58077

 | time: 111.701s


| Adam | epoch: 001 | loss: 0.58077 - acc: 0.6938 -- iter: 23360/24500


Training Step: 366  | total loss: 

0.58873

 | time: 112.088s


| Adam | epoch: 001 | loss: 0.58873 - acc: 0.6869 -- iter: 23424/24500


Training Step: 367  | total loss: 

0.59139

 | time: 112.480s


| Adam | epoch: 001 | loss: 0.59139 - acc: 0.6776 -- iter: 23488/24500


Training Step: 368  | total loss: 

0.58989

 | time: 112.879s


| Adam | epoch: 001 | loss: 0.58989 - acc: 0.6786 -- iter: 23552/24500


Training Step: 369  | total loss: 

0.58580

 | time: 113.270s


| Adam | epoch: 001 | loss: 0.58580 - acc: 0.6779 -- iter: 23616/24500


Training Step: 370  | total loss: 

0.58686

 | time: 113.654s


| Adam | epoch: 001 | loss: 0.58686 - acc: 0.6773 -- iter: 23680/24500


Training Step: 371  | total loss: 

0.58688

 | time: 114.029s


| Adam | epoch: 001 | loss: 0.58688 - acc: 0.6721 -- iter: 23744/24500


Training Step: 372  | total loss: 

0.59021

 | time: 114.416s


| Adam | epoch: 001 | loss: 0.59021 - acc: 0.6783 -- iter: 23808/24500


Training Step: 373  | total loss: 

0.59012

 | time: 114.800s


| Adam | epoch: 001 | loss: 0.59012 - acc: 0.6824 -- iter: 23872/24500


Training Step: 374  | total loss: 

0.58681

 | time: 115.214s


| Adam | epoch: 001 | loss: 0.58681 - acc: 0.6829 -- iter: 23936/24500


Training Step: 375  | total loss: 

0.58162

 | time: 115.595s


| Adam | epoch: 001 | loss: 0.58162 - acc: 0.6896 -- iter: 24000/24500


Training Step: 376  | total loss: 

0.58321

 | time: 115.979s


| Adam | epoch: 001 | loss: 0.58321 - acc: 0.6847 -- iter: 24064/24500


Training Step: 377  | total loss: 

0.58546

 | time: 116.365s


| Adam | epoch: 001 | loss: 0.58546 - acc: 0.6850 -- iter: 24128/24500


Training Step: 378  | total loss: 

0.58926

 | time: 116.778s


| Adam | epoch: 001 | loss: 0.58926 - acc: 0.6790 -- iter: 24192/24500


Training Step: 379  | total loss: 

0.58318

 | time: 117.170s


| Adam | epoch: 001 | loss: 0.58318 - acc: 0.6861 -- iter: 24256/24500


Training Step: 380  | total loss: 

0.57388

 | time: 117.576s


| Adam | epoch: 001 | loss: 0.57388 - acc: 0.6956 -- iter: 24320/24500


Training Step: 381  | total loss: 

0.57273

 | time: 117.900s


| Adam | epoch: 001 | loss: 0.57273 - acc: 0.6963 -- iter: 24384/24500


Training Step: 382  | total loss: 

0.57399

 | time: 118.239s


| Adam | epoch: 001 | loss: 0.57399 - acc: 0.6955 -- iter: 24448/24500


Training Step: 383  | total loss: 

0.56411

 | time: 119.586s


| Adam | epoch: 001 | loss: 0.56411 - acc: 0.7025 | val_loss: 0.60984 - val_acc: 0.6700 -- iter: 24500/24500
--


Training Step: 384  | total loss: 

0.56161

 | time: 0.227s


| Adam | epoch: 002 | loss: 0.56161 - acc: 0.7015 -- iter: 00064/24500


Training Step: 385  | total loss: 

0.55845

 | time: 0.543s


| Adam | epoch: 002 | loss: 0.55845 - acc: 0.7025 -- iter: 00128/24500


Training Step: 386  | total loss: 

0.56459

 | time: 0.817s


| Adam | epoch: 002 | loss: 0.56459 - acc: 0.6978 -- iter: 00192/24500


Training Step: 387  | total loss: 

0.55108

 | time: 1.100s


| Adam | epoch: 002 | loss: 0.55108 - acc: 0.7093 -- iter: 00256/24500


Training Step: 388  | total loss: 

0.54932

 | time: 1.376s


| Adam | epoch: 002 | loss: 0.54932 - acc: 0.7134 -- iter: 00320/24500


Training Step: 389  | total loss: 

0.56173

 | time: 1.634s


| Adam | epoch: 002 | loss: 0.56173 - acc: 0.7092 -- iter: 00384/24500


Training Step: 390  | total loss: 

0.55768

 | time: 1.897s


| Adam | epoch: 002 | loss: 0.55768 - acc: 0.7086 -- iter: 00448/24500


Training Step: 391  | total loss: 

0.56486

 | time: 2.168s


| Adam | epoch: 002 | loss: 0.56486 - acc: 0.6987 -- iter: 00512/24500


Training Step: 392  | total loss: 

0.57064

 | time: 2.425s


| Adam | epoch: 002 | loss: 0.57064 - acc: 0.6898 -- iter: 00576/24500


Training Step: 393  | total loss: 

0.58143

 | time: 2.699s


| Adam | epoch: 002 | loss: 0.58143 - acc: 0.6911 -- iter: 00640/24500


Training Step: 394  | total loss: 

0.60722

 | time: 2.955s


| Adam | epoch: 002 | loss: 0.60722 - acc: 0.6798 -- iter: 00704/24500


Training Step: 395  | total loss: 

0.61175

 | time: 3.214s


| Adam | epoch: 002 | loss: 0.61175 - acc: 0.6790 -- iter: 00768/24500


Training Step: 396  | total loss: 

0.60782

 | time: 3.476s


| Adam | epoch: 002 | loss: 0.60782 - acc: 0.6845 -- iter: 00832/24500


Training Step: 397  | total loss: 

0.60162

 | time: 3.744s


| Adam | epoch: 002 | loss: 0.60162 - acc: 0.6848 -- iter: 00896/24500


Training Step: 398  | total loss: 

0.59868

 | time: 4.016s


| Adam | epoch: 002 | loss: 0.59868 - acc: 0.6898 -- iter: 00960/24500


Training Step: 399  | total loss: 

0.60395

 | time: 4.286s


| Adam | epoch: 002 | loss: 0.60395 - acc: 0.6818 -- iter: 01024/24500


Training Step: 400  | total loss: 

0.60775

 | time: 4.564s


| Adam | epoch: 002 | loss: 0.60775 - acc: 0.6808 -- iter: 01088/24500


Training Step: 401  | total loss: 

0.60294

 | time: 4.832s


| Adam | epoch: 002 | loss: 0.60294 - acc: 0.6814 -- iter: 01152/24500


Training Step: 402  | total loss: 

0.60078

 | time: 5.121s


| Adam | epoch: 002 | loss: 0.60078 - acc: 0.6758 -- iter: 01216/24500


Training Step: 403  | total loss: 

0.59755

 | time: 5.395s


| Adam | epoch: 002 | loss: 0.59755 - acc: 0.6817 -- iter: 01280/24500


Training Step: 404  | total loss: 

0.59653

 | time: 5.656s


| Adam | epoch: 002 | loss: 0.59653 - acc: 0.6885 -- iter: 01344/24500


Training Step: 405  | total loss: 

0.60180

 | time: 5.926s


| Adam | epoch: 002 | loss: 0.60180 - acc: 0.6837 -- iter: 01408/24500


Training Step: 406  | total loss: 

0.60447

 | time: 6.194s


| Adam | epoch: 002 | loss: 0.60447 - acc: 0.6810 -- iter: 01472/24500


Training Step: 407  | total loss: 

0.60555

 | time: 6.482s


| Adam | epoch: 002 | loss: 0.60555 - acc: 0.6769 -- iter: 01536/24500


Training Step: 408  | total loss: 

0.60564

 | time: 6.753s


| Adam | epoch: 002 | loss: 0.60564 - acc: 0.6764 -- iter: 01600/24500


Training Step: 409  | total loss: 

0.60509

 | time: 7.035s


| Adam | epoch: 002 | loss: 0.60509 - acc: 0.6791 -- iter: 01664/24500


Training Step: 410  | total loss: 

0.60677

 | time: 7.296s


| Adam | epoch: 002 | loss: 0.60677 - acc: 0.6768 -- iter: 01728/24500


Training Step: 411  | total loss: 

0.61271

 | time: 7.568s


| Adam | epoch: 002 | loss: 0.61271 - acc: 0.6654 -- iter: 01792/24500


Training Step: 412  | total loss: 

0.61071

 | time: 7.835s


| Adam | epoch: 002 | loss: 0.61071 - acc: 0.6723 -- iter: 01856/24500


Training Step: 413  | total loss: 

0.61469

 | time: 8.107s


| Adam | epoch: 002 | loss: 0.61469 - acc: 0.6660 -- iter: 01920/24500


Training Step: 414  | total loss: 

0.60908

 | time: 8.385s


| Adam | epoch: 002 | loss: 0.60908 - acc: 0.6713 -- iter: 01984/24500


Training Step: 415  | total loss: 

0.59599

 | time: 8.653s


| Adam | epoch: 002 | loss: 0.59599 - acc: 0.6823 -- iter: 02048/24500


Training Step: 416  | total loss: 

0.59971

 | time: 8.930s


| Adam | epoch: 002 | loss: 0.59971 - acc: 0.6781 -- iter: 02112/24500


Training Step: 417  | total loss: 

0.60514

 | time: 9.210s


| Adam | epoch: 002 | loss: 0.60514 - acc: 0.6728 -- iter: 02176/24500


Training Step: 418  | total loss: 

0.60677

 | time: 9.480s


| Adam | epoch: 002 | loss: 0.60677 - acc: 0.6743 -- iter: 02240/24500


Training Step: 419  | total loss: 

0.60371

 | time: 9.748s


| Adam | epoch: 002 | loss: 0.60371 - acc: 0.6771 -- iter: 02304/24500


Training Step: 420  | total loss: 

0.60844

 | time: 10.014s


| Adam | epoch: 002 | loss: 0.60844 - acc: 0.6751 -- iter: 02368/24500


Training Step: 421  | total loss: 

0.60713

 | time: 10.309s


| Adam | epoch: 002 | loss: 0.60713 - acc: 0.6747 -- iter: 02432/24500


Training Step: 422  | total loss: 

0.60666

 | time: 10.580s


| Adam | epoch: 002 | loss: 0.60666 - acc: 0.6651 -- iter: 02496/24500


Training Step: 423  | total loss: 

0.60521

 | time: 10.849s


| Adam | epoch: 002 | loss: 0.60521 - acc: 0.6642 -- iter: 02560/24500


Training Step: 424  | total loss: 

0.60069

 | time: 11.086s


| Adam | epoch: 002 | loss: 0.60069 - acc: 0.6681 -- iter: 02624/24500


Training Step: 425  | total loss: 

0.60776

 | time: 11.336s


| Adam | epoch: 002 | loss: 0.60776 - acc: 0.6638 -- iter: 02688/24500


Training Step: 426  | total loss: 

0.60671

 | time: 11.575s


| Adam | epoch: 002 | loss: 0.60671 - acc: 0.6693 -- iter: 02752/24500


Training Step: 427  | total loss: 

0.60014

 | time: 11.809s


| Adam | epoch: 002 | loss: 0.60014 - acc: 0.6711 -- iter: 02816/24500


Training Step: 428  | total loss: 

0.58895

 | time: 12.045s


| Adam | epoch: 002 | loss: 0.58895 - acc: 0.6837 -- iter: 02880/24500


Training Step: 429  | total loss: 

0.58928

 | time: 12.290s


| Adam | epoch: 002 | loss: 0.58928 - acc: 0.6794 -- iter: 02944/24500


Training Step: 430  | total loss: 

0.58193

 | time: 12.528s


| Adam | epoch: 002 | loss: 0.58193 - acc: 0.6896 -- iter: 03008/24500


Training Step: 431  | total loss: 

0.57960

 | time: 12.781s


| Adam | epoch: 002 | loss: 0.57960 - acc: 0.6862 -- iter: 03072/24500


Training Step: 432  | total loss: 

0.58263

 | time: 13.029s


| Adam | epoch: 002 | loss: 0.58263 - acc: 0.6864 -- iter: 03136/24500


Training Step: 433  | total loss: 

0.57993

 | time: 13.272s


| Adam | epoch: 002 | loss: 0.57993 - acc: 0.6943 -- iter: 03200/24500


Training Step: 434  | total loss: 

0.58800

 | time: 13.524s


| Adam | epoch: 002 | loss: 0.58800 - acc: 0.6827 -- iter: 03264/24500


Training Step: 435  | total loss: 

0.57907

 | time: 13.773s


| Adam | epoch: 002 | loss: 0.57907 - acc: 0.6894 -- iter: 03328/24500


Training Step: 436  | total loss: 

0.57762

 | time: 14.014s


| Adam | epoch: 002 | loss: 0.57762 - acc: 0.6830 -- iter: 03392/24500


Training Step: 437  | total loss: 

0.57793

 | time: 14.264s


| Adam | epoch: 002 | loss: 0.57793 - acc: 0.6819 -- iter: 03456/24500


Training Step: 438  | total loss: 

0.57807

 | time: 14.511s


| Adam | epoch: 002 | loss: 0.57807 - acc: 0.6871 -- iter: 03520/24500


Training Step: 439  | total loss: 

0.57657

 | time: 14.758s


| Adam | epoch: 002 | loss: 0.57657 - acc: 0.6903 -- iter: 03584/24500


Training Step: 440  | total loss: 

0.57395

 | time: 15.001s


| Adam | epoch: 002 | loss: 0.57395 - acc: 0.6978 -- iter: 03648/24500


Training Step: 441  | total loss: 

0.56887

 | time: 15.246s


| Adam | epoch: 002 | loss: 0.56887 - acc: 0.7015 -- iter: 03712/24500


Training Step: 442  | total loss: 

0.57509

 | time: 15.497s


| Adam | epoch: 002 | loss: 0.57509 - acc: 0.7016 -- iter: 03776/24500


Training Step: 443  | total loss: 

0.57051

 | time: 15.749s


| Adam | epoch: 002 | loss: 0.57051 - acc: 0.7049 -- iter: 03840/24500


Training Step: 444  | total loss: 

0.56069

 | time: 15.994s


| Adam | epoch: 002 | loss: 0.56069 - acc: 0.7172 -- iter: 03904/24500


Training Step: 445  | total loss: 

0.55723

 | time: 16.245s


| Adam | epoch: 002 | loss: 0.55723 - acc: 0.7205 -- iter: 03968/24500


Training Step: 446  | total loss: 

0.55892

 | time: 16.492s


| Adam | epoch: 002 | loss: 0.55892 - acc: 0.7172 -- iter: 04032/24500


Training Step: 447  | total loss: 

0.55938

 | time: 16.740s


| Adam | epoch: 002 | loss: 0.55938 - acc: 0.7142 -- iter: 04096/24500


Training Step: 448  | total loss: 

0.55240

 | time: 16.985s


| Adam | epoch: 002 | loss: 0.55240 - acc: 0.7209 -- iter: 04160/24500


Training Step: 449  | total loss: 

0.54848

 | time: 17.238s


| Adam | epoch: 002 | loss: 0.54848 - acc: 0.7254 -- iter: 04224/24500


Training Step: 450  | total loss: 

0.54741

 | time: 17.484s


| Adam | epoch: 002 | loss: 0.54741 - acc: 0.7294 -- iter: 04288/24500


Training Step: 451  | total loss: 

0.54734

 | time: 17.717s


| Adam | epoch: 002 | loss: 0.54734 - acc: 0.7268 -- iter: 04352/24500


Training Step: 452  | total loss: 

0.54251

 | time: 17.961s


| Adam | epoch: 002 | loss: 0.54251 - acc: 0.7369 -- iter: 04416/24500


Training Step: 453  | total loss: 

0.54483

 | time: 18.197s


| Adam | epoch: 002 | loss: 0.54483 - acc: 0.7367 -- iter: 04480/24500


Training Step: 454  | total loss: 

0.57258

 | time: 18.440s


| Adam | epoch: 002 | loss: 0.57258 - acc: 0.7224 -- iter: 04544/24500


Training Step: 455  | total loss: 

0.56826

 | time: 18.685s


| Adam | epoch: 002 | loss: 0.56826 - acc: 0.7251 -- iter: 04608/24500


Training Step: 456  | total loss: 

0.56960

 | time: 18.923s


| Adam | epoch: 002 | loss: 0.56960 - acc: 0.7229 -- iter: 04672/24500


Training Step: 457  | total loss: 

0.57272

 | time: 19.160s


| Adam | epoch: 002 | loss: 0.57272 - acc: 0.7163 -- iter: 04736/24500


Training Step: 458  | total loss: 

0.58532

 | time: 19.404s


| Adam | epoch: 002 | loss: 0.58532 - acc: 0.7071 -- iter: 04800/24500


Training Step: 459  | total loss: 

0.58461

 | time: 19.649s


| Adam | epoch: 002 | loss: 0.58461 - acc: 0.7052 -- iter: 04864/24500


Training Step: 460  | total loss: 

0.59180

 | time: 19.883s


| Adam | epoch: 002 | loss: 0.59180 - acc: 0.7065 -- iter: 04928/24500


Training Step: 461  | total loss: 

0.58601

 | time: 20.128s


| Adam | epoch: 002 | loss: 0.58601 - acc: 0.7078 -- iter: 04992/24500


Training Step: 462  | total loss: 

0.58399

 | time: 20.379s


| Adam | epoch: 002 | loss: 0.58399 - acc: 0.7104 -- iter: 05056/24500


Training Step: 463  | total loss: 

0.58565

 | time: 20.614s


| Adam | epoch: 002 | loss: 0.58565 - acc: 0.7066 -- iter: 05120/24500


Training Step: 464  | total loss: 

0.58763

 | time: 20.845s


| Adam | epoch: 002 | loss: 0.58763 - acc: 0.7078 -- iter: 05184/24500


Training Step: 465  | total loss: 

0.59253

 | time: 21.092s


| Adam | epoch: 002 | loss: 0.59253 - acc: 0.7011 -- iter: 05248/24500


Training Step: 466  | total loss: 

0.59306

 | time: 21.341s


| Adam | epoch: 002 | loss: 0.59306 - acc: 0.6997 -- iter: 05312/24500


Training Step: 467  | total loss: 

0.58682

 | time: 21.583s


| Adam | epoch: 002 | loss: 0.58682 - acc: 0.7016 -- iter: 05376/24500


Training Step: 468  | total loss: 

0.58759

 | time: 21.828s


| Adam | epoch: 002 | loss: 0.58759 - acc: 0.6940 -- iter: 05440/24500


Training Step: 469  | total loss: 

0.58852

 | time: 22.074s


| Adam | epoch: 002 | loss: 0.58852 - acc: 0.6917 -- iter: 05504/24500


Training Step: 470  | total loss: 

0.58996

 | time: 22.314s


| Adam | epoch: 002 | loss: 0.58996 - acc: 0.6898 -- iter: 05568/24500


Training Step: 471  | total loss: 

0.58546

 | time: 22.561s


| Adam | epoch: 002 | loss: 0.58546 - acc: 0.6927 -- iter: 05632/24500


Training Step: 472  | total loss: 

0.57725

 | time: 22.806s


| Adam | epoch: 002 | loss: 0.57725 - acc: 0.7015 -- iter: 05696/24500


Training Step: 473  | total loss: 

0.56970

 | time: 23.045s


| Adam | epoch: 002 | loss: 0.56970 - acc: 0.7095 -- iter: 05760/24500


Training Step: 474  | total loss: 

0.56244

 | time: 23.284s


| Adam | epoch: 002 | loss: 0.56244 - acc: 0.7120 -- iter: 05824/24500


Training Step: 475  | total loss: 

0.57125

 | time: 23.532s


| Adam | epoch: 002 | loss: 0.57125 - acc: 0.7095 -- iter: 05888/24500


Training Step: 476  | total loss: 

0.58066

 | time: 23.764s


| Adam | epoch: 002 | loss: 0.58066 - acc: 0.6995 -- iter: 05952/24500


Training Step: 477  | total loss: 

0.57311

 | time: 23.999s


| Adam | epoch: 002 | loss: 0.57311 - acc: 0.7061 -- iter: 06016/24500


Training Step: 478  | total loss: 

0.57426

 | time: 24.241s


| Adam | epoch: 002 | loss: 0.57426 - acc: 0.6996 -- iter: 06080/24500


Training Step: 479  | total loss: 

0.57332

 | time: 24.493s


| Adam | epoch: 002 | loss: 0.57332 - acc: 0.7015 -- iter: 06144/24500


Training Step: 480  | total loss: 

0.56881

 | time: 24.742s


| Adam | epoch: 002 | loss: 0.56881 - acc: 0.7079 -- iter: 06208/24500


Training Step: 481  | total loss: 

0.56547

 | time: 24.989s


| Adam | epoch: 002 | loss: 0.56547 - acc: 0.7106 -- iter: 06272/24500


Training Step: 482  | total loss: 

0.56632

 | time: 25.238s


| Adam | epoch: 002 | loss: 0.56632 - acc: 0.7129 -- iter: 06336/24500


Training Step: 483  | total loss: 

0.56277

 | time: 25.487s


| Adam | epoch: 002 | loss: 0.56277 - acc: 0.7166 -- iter: 06400/24500


Training Step: 484  | total loss: 

0.56594

 | time: 25.733s


| Adam | epoch: 002 | loss: 0.56594 - acc: 0.7106 -- iter: 06464/24500


Training Step: 485  | total loss: 

0.56819

 | time: 25.980s


| Adam | epoch: 002 | loss: 0.56819 - acc: 0.7036 -- iter: 06528/24500


Training Step: 486  | total loss: 

0.56504

 | time: 26.227s


| Adam | epoch: 002 | loss: 0.56504 - acc: 0.7082 -- iter: 06592/24500


Training Step: 487  | total loss: 

0.56027

 | time: 26.467s


| Adam | epoch: 002 | loss: 0.56027 - acc: 0.7140 -- iter: 06656/24500


Training Step: 488  | total loss: 

0.55466

 | time: 26.708s


| Adam | epoch: 002 | loss: 0.55466 - acc: 0.7176 -- iter: 06720/24500


Training Step: 489  | total loss: 

0.55002

 | time: 26.950s


| Adam | epoch: 002 | loss: 0.55002 - acc: 0.7146 -- iter: 06784/24500


Training Step: 490  | total loss: 

0.58103

 | time: 27.193s


| Adam | epoch: 002 | loss: 0.58103 - acc: 0.7056 -- iter: 06848/24500


Training Step: 491  | total loss: 

0.59211

 | time: 27.431s


| Adam | epoch: 002 | loss: 0.59211 - acc: 0.7007 -- iter: 06912/24500


Training Step: 492  | total loss: 

0.58755

 | time: 27.663s


| Adam | epoch: 002 | loss: 0.58755 - acc: 0.6994 -- iter: 06976/24500


Training Step: 493  | total loss: 

0.57545

 | time: 27.903s


| Adam | epoch: 002 | loss: 0.57545 - acc: 0.7122 -- iter: 07040/24500


Training Step: 494  | total loss: 

0.57131

 | time: 28.154s


| Adam | epoch: 002 | loss: 0.57131 - acc: 0.7176 -- iter: 07104/24500


Training Step: 495  | total loss: 

0.56957

 | time: 28.386s


| Adam | epoch: 002 | loss: 0.56957 - acc: 0.7208 -- iter: 07168/24500


Training Step: 496  | total loss: 

0.56900

 | time: 28.624s


| Adam | epoch: 002 | loss: 0.56900 - acc: 0.7175 -- iter: 07232/24500


Training Step: 497  | total loss: 

0.57010

 | time: 28.871s


| Adam | epoch: 002 | loss: 0.57010 - acc: 0.7161 -- iter: 07296/24500


Training Step: 498  | total loss: 

0.56341

 | time: 29.107s


| Adam | epoch: 002 | loss: 0.56341 - acc: 0.7241 -- iter: 07360/24500


Training Step: 499  | total loss: 

0.55154

 | time: 29.347s


| Adam | epoch: 002 | loss: 0.55154 - acc: 0.7267 -- iter: 07424/24500


Training Step: 500  | total loss: 

0.54711

 | time: 30.596s


| Adam | epoch: 002 | loss: 0.54711 - acc: 0.7275 | val_loss: 0.56637 - val_acc: 0.7260 -- iter: 07488/24500
--


Training Step: 501  | total loss: 

0.54441

 | time: 30.883s


| Adam | epoch: 002 | loss: 0.54441 - acc: 0.7313 -- iter: 07552/24500


Training Step: 502  | total loss: 

0.54456

 | time: 31.120s


| Adam | epoch: 002 | loss: 0.54456 - acc: 0.7269 -- iter: 07616/24500


Training Step: 503  | total loss: 

0.54464

 | time: 31.359s


| Adam | epoch: 002 | loss: 0.54464 - acc: 0.7245 -- iter: 07680/24500


Training Step: 504  | total loss: 

0.54470

 | time: 31.601s


| Adam | epoch: 002 | loss: 0.54470 - acc: 0.7240 -- iter: 07744/24500


Training Step: 505  | total loss: 

0.54533

 | time: 31.844s


| Adam | epoch: 002 | loss: 0.54533 - acc: 0.7297 -- iter: 07808/24500


Training Step: 506  | total loss: 

0.54458

 | time: 32.089s


| Adam | epoch: 002 | loss: 0.54458 - acc: 0.7255 -- iter: 07872/24500


Training Step: 507  | total loss: 

0.54521

 | time: 32.339s


| Adam | epoch: 002 | loss: 0.54521 - acc: 0.7310 -- iter: 07936/24500


Training Step: 508  | total loss: 

0.54387

 | time: 32.576s


| Adam | epoch: 002 | loss: 0.54387 - acc: 0.7329 -- iter: 08000/24500


Training Step: 509  | total loss: 

0.53478

 | time: 32.819s


| Adam | epoch: 002 | loss: 0.53478 - acc: 0.7362 -- iter: 08064/24500


Training Step: 510  | total loss: 

0.54335

 | time: 33.059s


| Adam | epoch: 002 | loss: 0.54335 - acc: 0.7313 -- iter: 08128/24500


Training Step: 511  | total loss: 

0.54167

 | time: 33.313s


| Adam | epoch: 002 | loss: 0.54167 - acc: 0.7410 -- iter: 08192/24500


Training Step: 512  | total loss: 

0.54258

 | time: 33.560s


| Adam | epoch: 002 | loss: 0.54258 - acc: 0.7419 -- iter: 08256/24500


Training Step: 513  | total loss: 

0.53930

 | time: 33.807s


| Adam | epoch: 002 | loss: 0.53930 - acc: 0.7427 -- iter: 08320/24500


Training Step: 514  | total loss: 

0.53580

 | time: 34.050s


| Adam | epoch: 002 | loss: 0.53580 - acc: 0.7497 -- iter: 08384/24500


Training Step: 515  | total loss: 

0.54419

 | time: 34.298s


| Adam | epoch: 002 | loss: 0.54419 - acc: 0.7419 -- iter: 08448/24500


Training Step: 516  | total loss: 

0.54733

 | time: 34.541s


| Adam | epoch: 002 | loss: 0.54733 - acc: 0.7412 -- iter: 08512/24500


Training Step: 517  | total loss: 

0.55302

 | time: 34.787s


| Adam | epoch: 002 | loss: 0.55302 - acc: 0.7311 -- iter: 08576/24500


Training Step: 518  | total loss: 

0.55809

 | time: 35.026s


| Adam | epoch: 002 | loss: 0.55809 - acc: 0.7205 -- iter: 08640/24500


Training Step: 519  | total loss: 

0.56230

 | time: 35.262s


| Adam | epoch: 002 | loss: 0.56230 - acc: 0.7219 -- iter: 08704/24500


Training Step: 520  | total loss: 

0.55836

 | time: 35.491s


| Adam | epoch: 002 | loss: 0.55836 - acc: 0.7231 -- iter: 08768/24500


Training Step: 521  | total loss: 

0.56367

 | time: 35.738s


| Adam | epoch: 002 | loss: 0.56367 - acc: 0.7180 -- iter: 08832/24500


Training Step: 522  | total loss: 

0.56236

 | time: 35.983s


| Adam | epoch: 002 | loss: 0.56236 - acc: 0.7212 -- iter: 08896/24500


Training Step: 523  | total loss: 

0.55762

 | time: 36.236s


| Adam | epoch: 002 | loss: 0.55762 - acc: 0.7241 -- iter: 08960/24500


Training Step: 524  | total loss: 

0.56214

 | time: 36.475s


| Adam | epoch: 002 | loss: 0.56214 - acc: 0.7204 -- iter: 09024/24500


Training Step: 525  | total loss: 

0.56642

 | time: 36.723s


| Adam | epoch: 002 | loss: 0.56642 - acc: 0.7187 -- iter: 09088/24500


Training Step: 526  | total loss: 

0.56741

 | time: 36.962s


| Adam | epoch: 002 | loss: 0.56741 - acc: 0.7140 -- iter: 09152/24500


Training Step: 527  | total loss: 

0.56981

 | time: 37.202s


| Adam | epoch: 002 | loss: 0.56981 - acc: 0.7129 -- iter: 09216/24500


Training Step: 528  | total loss: 

0.57900

 | time: 37.443s


| Adam | epoch: 002 | loss: 0.57900 - acc: 0.7073 -- iter: 09280/24500


Training Step: 529  | total loss: 

0.57148

 | time: 37.689s


| Adam | epoch: 002 | loss: 0.57148 - acc: 0.7084 -- iter: 09344/24500


Training Step: 530  | total loss: 

0.56575

 | time: 37.935s


| Adam | epoch: 002 | loss: 0.56575 - acc: 0.7157 -- iter: 09408/24500


Training Step: 531  | total loss: 

0.56336

 | time: 38.177s


| Adam | epoch: 002 | loss: 0.56336 - acc: 0.7129 -- iter: 09472/24500


Training Step: 532  | total loss: 

0.56291

 | time: 38.410s


| Adam | epoch: 002 | loss: 0.56291 - acc: 0.7135 -- iter: 09536/24500


Training Step: 533  | total loss: 

0.56693

 | time: 38.653s


| Adam | epoch: 002 | loss: 0.56693 - acc: 0.7046 -- iter: 09600/24500


Training Step: 534  | total loss: 

0.56885

 | time: 38.895s


| Adam | epoch: 002 | loss: 0.56885 - acc: 0.7029 -- iter: 09664/24500


Training Step: 535  | total loss: 

0.55869

 | time: 39.149s


| Adam | epoch: 002 | loss: 0.55869 - acc: 0.7107 -- iter: 09728/24500


Training Step: 536  | total loss: 

0.55812

 | time: 39.382s


| Adam | epoch: 002 | loss: 0.55812 - acc: 0.7131 -- iter: 09792/24500


Training Step: 537  | total loss: 

0.54645

 | time: 39.622s


| Adam | epoch: 002 | loss: 0.54645 - acc: 0.7246 -- iter: 09856/24500


Training Step: 538  | total loss: 

0.55610

 | time: 39.865s


| Adam | epoch: 002 | loss: 0.55610 - acc: 0.7162 -- iter: 09920/24500


Training Step: 539  | total loss: 

0.55890

 | time: 40.111s


| Adam | epoch: 002 | loss: 0.55890 - acc: 0.7133 -- iter: 09984/24500


Training Step: 540  | total loss: 

0.55418

 | time: 40.360s


| Adam | epoch: 002 | loss: 0.55418 - acc: 0.7233 -- iter: 10048/24500


Training Step: 541  | total loss: 

0.56078

 | time: 40.609s


| Adam | epoch: 002 | loss: 0.56078 - acc: 0.7166 -- iter: 10112/24500


Training Step: 542  | total loss: 

0.54654

 | time: 40.845s


| Adam | epoch: 002 | loss: 0.54654 - acc: 0.7277 -- iter: 10176/24500


Training Step: 543  | total loss: 

0.55486

 | time: 41.120s


| Adam | epoch: 002 | loss: 0.55486 - acc: 0.7237 -- iter: 10240/24500


Training Step: 544  | total loss: 

0.55061

 | time: 41.447s


| Adam | epoch: 002 | loss: 0.55061 - acc: 0.7263 -- iter: 10304/24500


Training Step: 545  | total loss: 

0.54485

 | time: 41.686s


| Adam | epoch: 002 | loss: 0.54485 - acc: 0.7318 -- iter: 10368/24500


Training Step: 546  | total loss: 

0.53818

 | time: 41.928s


| Adam | epoch: 002 | loss: 0.53818 - acc: 0.7336 -- iter: 10432/24500


Training Step: 547  | total loss: 

0.53616

 | time: 42.165s


| Adam | epoch: 002 | loss: 0.53616 - acc: 0.7306 -- iter: 10496/24500


Training Step: 548  | total loss: 

0.53906

 | time: 42.406s


| Adam | epoch: 002 | loss: 0.53906 - acc: 0.7325 -- iter: 10560/24500


Training Step: 549  | total loss: 

0.54584

 | time: 42.648s


| Adam | epoch: 002 | loss: 0.54584 - acc: 0.7233 -- iter: 10624/24500


Training Step: 550  | total loss: 

0.54299

 | time: 42.891s


| Adam | epoch: 002 | loss: 0.54299 - acc: 0.7260 -- iter: 10688/24500


Training Step: 551  | total loss: 

0.53122

 | time: 43.130s


| Adam | epoch: 002 | loss: 0.53122 - acc: 0.7346 -- iter: 10752/24500


Training Step: 552  | total loss: 

0.52505

 | time: 43.374s


| Adam | epoch: 002 | loss: 0.52505 - acc: 0.7362 -- iter: 10816/24500


Training Step: 553  | total loss: 

0.51850

 | time: 43.629s


| Adam | epoch: 002 | loss: 0.51850 - acc: 0.7360 -- iter: 10880/24500


Training Step: 554  | total loss: 

0.52329

 | time: 43.879s


| Adam | epoch: 002 | loss: 0.52329 - acc: 0.7343 -- iter: 10944/24500


Training Step: 555  | total loss: 

0.53859

 | time: 44.122s


| Adam | epoch: 002 | loss: 0.53859 - acc: 0.7234 -- iter: 11008/24500


Training Step: 556  | total loss: 

0.54554

 | time: 44.367s


| Adam | epoch: 002 | loss: 0.54554 - acc: 0.7245 -- iter: 11072/24500


Training Step: 557  | total loss: 

0.53598

 | time: 44.606s


| Adam | epoch: 002 | loss: 0.53598 - acc: 0.7317 -- iter: 11136/24500


Training Step: 558  | total loss: 

0.53666

 | time: 44.860s


| Adam | epoch: 002 | loss: 0.53666 - acc: 0.7273 -- iter: 11200/24500


Training Step: 559  | total loss: 

0.54303

 | time: 45.096s


| Adam | epoch: 002 | loss: 0.54303 - acc: 0.7249 -- iter: 11264/24500


Training Step: 560  | total loss: 

0.54262

 | time: 45.341s


| Adam | epoch: 002 | loss: 0.54262 - acc: 0.7211 -- iter: 11328/24500


Training Step: 561  | total loss: 

0.53656

 | time: 45.587s


| Adam | epoch: 002 | loss: 0.53656 - acc: 0.7318 -- iter: 11392/24500


Training Step: 562  | total loss: 

0.53624

 | time: 45.826s


| Adam | epoch: 002 | loss: 0.53624 - acc: 0.7305 -- iter: 11456/24500


Training Step: 563  | total loss: 

0.54335

 | time: 46.072s


| Adam | epoch: 002 | loss: 0.54335 - acc: 0.7262 -- iter: 11520/24500


Training Step: 564  | total loss: 

0.53946

 | time: 46.315s


| Adam | epoch: 002 | loss: 0.53946 - acc: 0.7239 -- iter: 11584/24500


Training Step: 565  | total loss: 

0.53986

 | time: 46.559s


| Adam | epoch: 002 | loss: 0.53986 - acc: 0.7203 -- iter: 11648/24500


Training Step: 566  | total loss: 

0.53679

 | time: 46.807s


| Adam | epoch: 002 | loss: 0.53679 - acc: 0.7295 -- iter: 11712/24500


Training Step: 567  | total loss: 

0.54857

 | time: 47.050s


| Adam | epoch: 002 | loss: 0.54857 - acc: 0.7190 -- iter: 11776/24500


Training Step: 568  | total loss: 

0.56605

 | time: 47.313s


| Adam | epoch: 002 | loss: 0.56605 - acc: 0.7081 -- iter: 11840/24500


Training Step: 569  | total loss: 

0.57064

 | time: 47.564s


| Adam | epoch: 002 | loss: 0.57064 - acc: 0.7091 -- iter: 11904/24500


Training Step: 570  | total loss: 

0.56422

 | time: 47.815s


| Adam | epoch: 002 | loss: 0.56422 - acc: 0.7148 -- iter: 11968/24500


Training Step: 571  | total loss: 

0.56794

 | time: 48.060s


| Adam | epoch: 002 | loss: 0.56794 - acc: 0.7089 -- iter: 12032/24500


Training Step: 572  | total loss: 

0.56502

 | time: 48.298s


| Adam | epoch: 002 | loss: 0.56502 - acc: 0.7068 -- iter: 12096/24500


Training Step: 573  | total loss: 

0.56608

 | time: 48.542s


| Adam | epoch: 002 | loss: 0.56608 - acc: 0.7017 -- iter: 12160/24500


Training Step: 574  | total loss: 

0.55543

 | time: 48.787s


| Adam | epoch: 002 | loss: 0.55543 - acc: 0.7144 -- iter: 12224/24500


Training Step: 575  | total loss: 

0.55222

 | time: 49.026s


| Adam | epoch: 002 | loss: 0.55222 - acc: 0.7258 -- iter: 12288/24500


Training Step: 576  | total loss: 

0.54867

 | time: 49.272s


| Adam | epoch: 002 | loss: 0.54867 - acc: 0.7251 -- iter: 12352/24500


Training Step: 577  | total loss: 

0.54670

 | time: 49.504s


| Adam | epoch: 002 | loss: 0.54670 - acc: 0.7229 -- iter: 12416/24500


Training Step: 578  | total loss: 

0.55353

 | time: 49.756s


| Adam | epoch: 002 | loss: 0.55353 - acc: 0.7193 -- iter: 12480/24500


Training Step: 579  | total loss: 

0.54859

 | time: 50.001s


| Adam | epoch: 002 | loss: 0.54859 - acc: 0.7240 -- iter: 12544/24500


Training Step: 580  | total loss: 

0.55065

 | time: 50.238s


| Adam | epoch: 002 | loss: 0.55065 - acc: 0.7219 -- iter: 12608/24500


Training Step: 581  | total loss: 

0.55152

 | time: 50.478s


| Adam | epoch: 002 | loss: 0.55152 - acc: 0.7216 -- iter: 12672/24500


Training Step: 582  | total loss: 

0.54753

 | time: 50.726s


| Adam | epoch: 002 | loss: 0.54753 - acc: 0.7275 -- iter: 12736/24500


Training Step: 583  | total loss: 

0.56892

 | time: 50.971s


| Adam | epoch: 002 | loss: 0.56892 - acc: 0.7188 -- iter: 12800/24500


Training Step: 584  | total loss: 

0.58896

 | time: 51.213s


| Adam | epoch: 002 | loss: 0.58896 - acc: 0.7079 -- iter: 12864/24500


Training Step: 585  | total loss: 

0.57709

 | time: 51.446s


| Adam | epoch: 002 | loss: 0.57709 - acc: 0.7152 -- iter: 12928/24500


Training Step: 586  | total loss: 

0.57109

 | time: 51.691s


| Adam | epoch: 002 | loss: 0.57109 - acc: 0.7250 -- iter: 12992/24500


Training Step: 587  | total loss: 

0.57547

 | time: 51.937s


| Adam | epoch: 002 | loss: 0.57547 - acc: 0.7196 -- iter: 13056/24500


Training Step: 588  | total loss: 

0.57883

 | time: 52.181s


| Adam | epoch: 002 | loss: 0.57883 - acc: 0.7133 -- iter: 13120/24500


Training Step: 589  | total loss: 

0.58004

 | time: 52.426s


| Adam | epoch: 002 | loss: 0.58004 - acc: 0.7107 -- iter: 13184/24500


Training Step: 590  | total loss: 

0.56603

 | time: 52.667s


| Adam | epoch: 002 | loss: 0.56603 - acc: 0.7240 -- iter: 13248/24500


Training Step: 591  | total loss: 

0.55768

 | time: 52.918s


| Adam | epoch: 002 | loss: 0.55768 - acc: 0.7298 -- iter: 13312/24500


Training Step: 592  | total loss: 

0.55285

 | time: 53.153s


| Adam | epoch: 002 | loss: 0.55285 - acc: 0.7349 -- iter: 13376/24500


Training Step: 593  | total loss: 

0.54832

 | time: 53.396s


| Adam | epoch: 002 | loss: 0.54832 - acc: 0.7380 -- iter: 13440/24500


Training Step: 594  | total loss: 

0.55369

 | time: 53.649s


| Adam | epoch: 002 | loss: 0.55369 - acc: 0.7329 -- iter: 13504/24500


Training Step: 595  | total loss: 

0.56310

 | time: 53.898s


| Adam | epoch: 002 | loss: 0.56310 - acc: 0.7237 -- iter: 13568/24500


Training Step: 596  | total loss: 

0.55765

 | time: 54.141s


| Adam | epoch: 002 | loss: 0.55765 - acc: 0.7295 -- iter: 13632/24500


Training Step: 597  | total loss: 

0.55849

 | time: 54.384s


| Adam | epoch: 002 | loss: 0.55849 - acc: 0.7253 -- iter: 13696/24500


Training Step: 598  | total loss: 

0.55110

 | time: 54.630s


| Adam | epoch: 002 | loss: 0.55110 - acc: 0.7340 -- iter: 13760/24500


Training Step: 599  | total loss: 

0.55070

 | time: 54.875s


| Adam | epoch: 002 | loss: 0.55070 - acc: 0.7387 -- iter: 13824/24500


Training Step: 600  | total loss: 

0.54451

 | time: 55.118s


| Adam | epoch: 002 | loss: 0.54451 - acc: 0.7367 -- iter: 13888/24500


Training Step: 601  | total loss: 

0.54117

 | time: 55.359s


| Adam | epoch: 002 | loss: 0.54117 - acc: 0.7412 -- iter: 13952/24500


Training Step: 602  | total loss: 

0.54591

 | time: 55.613s


| Adam | epoch: 002 | loss: 0.54591 - acc: 0.7374 -- iter: 14016/24500


Training Step: 603  | total loss: 

0.55636

 | time: 55.858s


| Adam | epoch: 002 | loss: 0.55636 - acc: 0.7308 -- iter: 14080/24500


Training Step: 604  | total loss: 

0.55574

 | time: 56.096s


| Adam | epoch: 002 | loss: 0.55574 - acc: 0.7265 -- iter: 14144/24500


Training Step: 605  | total loss: 

0.55398

 | time: 56.332s


| Adam | epoch: 002 | loss: 0.55398 - acc: 0.7288 -- iter: 14208/24500


Training Step: 606  | total loss: 

0.55416

 | time: 56.581s


| Adam | epoch: 002 | loss: 0.55416 - acc: 0.7231 -- iter: 14272/24500


Training Step: 607  | total loss: 

0.56281

 | time: 56.821s


| Adam | epoch: 002 | loss: 0.56281 - acc: 0.7118 -- iter: 14336/24500


Training Step: 608  | total loss: 

0.56071

 | time: 57.070s


| Adam | epoch: 002 | loss: 0.56071 - acc: 0.7171 -- iter: 14400/24500


Training Step: 609  | total loss: 

0.55797

 | time: 57.315s


| Adam | epoch: 002 | loss: 0.55797 - acc: 0.7220 -- iter: 14464/24500


Training Step: 610  | total loss: 

0.55611

 | time: 57.560s


| Adam | epoch: 002 | loss: 0.55611 - acc: 0.7232 -- iter: 14528/24500


Training Step: 611  | total loss: 

0.55938

 | time: 57.811s


| Adam | epoch: 002 | loss: 0.55938 - acc: 0.7181 -- iter: 14592/24500


Training Step: 612  | total loss: 

0.56419

 | time: 58.065s


| Adam | epoch: 002 | loss: 0.56419 - acc: 0.7135 -- iter: 14656/24500


Training Step: 613  | total loss: 

0.56562

 | time: 58.306s


| Adam | epoch: 002 | loss: 0.56562 - acc: 0.7140 -- iter: 14720/24500


Training Step: 614  | total loss: 

0.56432

 | time: 58.539s


| Adam | epoch: 002 | loss: 0.56432 - acc: 0.7176 -- iter: 14784/24500


Training Step: 615  | total loss: 

0.56393

 | time: 58.782s


| Adam | epoch: 002 | loss: 0.56393 - acc: 0.7177 -- iter: 14848/24500


Training Step: 616  | total loss: 

0.56483

 | time: 59.023s


| Adam | epoch: 002 | loss: 0.56483 - acc: 0.7147 -- iter: 14912/24500


Training Step: 617  | total loss: 

0.55621

 | time: 59.272s


| Adam | epoch: 002 | loss: 0.55621 - acc: 0.7214 -- iter: 14976/24500


Training Step: 618  | total loss: 

0.55267

 | time: 59.524s


| Adam | epoch: 002 | loss: 0.55267 - acc: 0.7227 -- iter: 15040/24500


Training Step: 619  | total loss: 

0.55697

 | time: 59.760s


| Adam | epoch: 002 | loss: 0.55697 - acc: 0.7207 -- iter: 15104/24500


Training Step: 620  | total loss: 

0.55695

 | time: 60.012s


| Adam | epoch: 002 | loss: 0.55695 - acc: 0.7205 -- iter: 15168/24500


Training Step: 621  | total loss: 

0.55843

 | time: 60.263s


| Adam | epoch: 002 | loss: 0.55843 - acc: 0.7266 -- iter: 15232/24500


Training Step: 622  | total loss: 

0.55552

 | time: 60.506s


| Adam | epoch: 002 | loss: 0.55552 - acc: 0.7289 -- iter: 15296/24500


Training Step: 623  | total loss: 

0.55688

 | time: 60.760s


| Adam | epoch: 002 | loss: 0.55688 - acc: 0.7279 -- iter: 15360/24500


Training Step: 624  | total loss: 

0.54701

 | time: 61.016s


| Adam | epoch: 002 | loss: 0.54701 - acc: 0.7332 -- iter: 15424/24500


Training Step: 625  | total loss: 

0.54763

 | time: 61.255s


| Adam | epoch: 002 | loss: 0.54763 - acc: 0.7255 -- iter: 15488/24500


Training Step: 626  | total loss: 

0.54224

 | time: 61.504s


| Adam | epoch: 002 | loss: 0.54224 - acc: 0.7280 -- iter: 15552/24500


Training Step: 627  | total loss: 

0.54799

 | time: 61.742s


| Adam | epoch: 002 | loss: 0.54799 - acc: 0.7224 -- iter: 15616/24500


Training Step: 628  | total loss: 

0.56099

 | time: 61.975s


| Adam | epoch: 002 | loss: 0.56099 - acc: 0.7142 -- iter: 15680/24500


Training Step: 629  | total loss: 

0.55127

 | time: 62.220s


| Adam | epoch: 002 | loss: 0.55127 - acc: 0.7225 -- iter: 15744/24500


Training Step: 630  | total loss: 

0.55765

 | time: 62.452s


| Adam | epoch: 002 | loss: 0.55765 - acc: 0.7096 -- iter: 15808/24500


Training Step: 631  | total loss: 

0.55972

 | time: 62.705s


| Adam | epoch: 002 | loss: 0.55972 - acc: 0.7074 -- iter: 15872/24500


Training Step: 632  | total loss: 

0.54606

 | time: 62.944s


| Adam | epoch: 002 | loss: 0.54606 - acc: 0.7210 -- iter: 15936/24500


Training Step: 633  | total loss: 

0.54100

 | time: 63.187s


| Adam | epoch: 002 | loss: 0.54100 - acc: 0.7286 -- iter: 16000/24500


Training Step: 634  | total loss: 

0.53912

 | time: 63.433s


| Adam | epoch: 002 | loss: 0.53912 - acc: 0.7339 -- iter: 16064/24500


Training Step: 635  | total loss: 

0.53428

 | time: 63.672s


| Adam | epoch: 002 | loss: 0.53428 - acc: 0.7370 -- iter: 16128/24500


Training Step: 636  | total loss: 

0.53956

 | time: 63.913s


| Adam | epoch: 002 | loss: 0.53956 - acc: 0.7290 -- iter: 16192/24500


Training Step: 637  | total loss: 

0.54355

 | time: 64.157s


| Adam | epoch: 002 | loss: 0.54355 - acc: 0.7264 -- iter: 16256/24500


Training Step: 638  | total loss: 

0.54780

 | time: 64.406s


| Adam | epoch: 002 | loss: 0.54780 - acc: 0.7225 -- iter: 16320/24500


Training Step: 639  | total loss: 

0.55045

 | time: 64.643s


| Adam | epoch: 002 | loss: 0.55045 - acc: 0.7221 -- iter: 16384/24500


Training Step: 640  | total loss: 

0.55109

 | time: 64.890s


| Adam | epoch: 002 | loss: 0.55109 - acc: 0.7202 -- iter: 16448/24500


Training Step: 641  | total loss: 

0.54622

 | time: 65.142s


| Adam | epoch: 002 | loss: 0.54622 - acc: 0.7248 -- iter: 16512/24500


Training Step: 642  | total loss: 

0.54984

 | time: 65.389s


| Adam | epoch: 002 | loss: 0.54984 - acc: 0.7257 -- iter: 16576/24500


Training Step: 643  | total loss: 

0.55127

 | time: 65.632s


| Adam | epoch: 002 | loss: 0.55127 - acc: 0.7235 -- iter: 16640/24500


Training Step: 644  | total loss: 

0.54748

 | time: 65.874s


| Adam | epoch: 002 | loss: 0.54748 - acc: 0.7246 -- iter: 16704/24500


Training Step: 645  | total loss: 

0.54583

 | time: 66.128s


| Adam | epoch: 002 | loss: 0.54583 - acc: 0.7287 -- iter: 16768/24500


Training Step: 646  | total loss: 

0.54993

 | time: 66.366s


| Adam | epoch: 002 | loss: 0.54993 - acc: 0.7277 -- iter: 16832/24500


Training Step: 647  | total loss: 

0.54027

 | time: 66.613s


| Adam | epoch: 002 | loss: 0.54027 - acc: 0.7362 -- iter: 16896/24500


Training Step: 648  | total loss: 

0.54066

 | time: 66.851s


| Adam | epoch: 002 | loss: 0.54066 - acc: 0.7344 -- iter: 16960/24500


Training Step: 649  | total loss: 

0.54125

 | time: 67.102s


| Adam | epoch: 002 | loss: 0.54125 - acc: 0.7375 -- iter: 17024/24500


Training Step: 650  | total loss: 

0.54732

 | time: 67.350s


| Adam | epoch: 002 | loss: 0.54732 - acc: 0.7357 -- iter: 17088/24500


Training Step: 651  | total loss: 

0.54271

 | time: 67.597s


| Adam | epoch: 002 | loss: 0.54271 - acc: 0.7387 -- iter: 17152/24500


Training Step: 652  | total loss: 

0.53807

 | time: 67.841s


| Adam | epoch: 002 | loss: 0.53807 - acc: 0.7445 -- iter: 17216/24500


Training Step: 653  | total loss: 

0.53645

 | time: 68.082s


| Adam | epoch: 002 | loss: 0.53645 - acc: 0.7466 -- iter: 17280/24500


Training Step: 654  | total loss: 

0.52239

 | time: 68.321s


| Adam | epoch: 002 | loss: 0.52239 - acc: 0.7579 -- iter: 17344/24500


Training Step: 655  | total loss: 

0.51974

 | time: 68.568s


| Adam | epoch: 002 | loss: 0.51974 - acc: 0.7571 -- iter: 17408/24500


Training Step: 656  | total loss: 

0.53405

 | time: 68.798s


| Adam | epoch: 002 | loss: 0.53405 - acc: 0.7439 -- iter: 17472/24500


Training Step: 657  | total loss: 

0.53978

 | time: 69.037s


| Adam | epoch: 002 | loss: 0.53978 - acc: 0.7367 -- iter: 17536/24500


Training Step: 658  | total loss: 

0.54156

 | time: 69.289s


| Adam | epoch: 002 | loss: 0.54156 - acc: 0.7349 -- iter: 17600/24500


Training Step: 659  | total loss: 

0.53964

 | time: 69.532s


| Adam | epoch: 002 | loss: 0.53964 - acc: 0.7364 -- iter: 17664/24500


Training Step: 660  | total loss: 

0.53612

 | time: 69.778s


| Adam | epoch: 002 | loss: 0.53612 - acc: 0.7409 -- iter: 17728/24500


Training Step: 661  | total loss: 

0.52524

 | time: 70.015s


| Adam | epoch: 002 | loss: 0.52524 - acc: 0.7496 -- iter: 17792/24500


Training Step: 662  | total loss: 

0.53906

 | time: 70.265s


| Adam | epoch: 002 | loss: 0.53906 - acc: 0.7309 -- iter: 17856/24500


Training Step: 663  | total loss: 

0.54796

 | time: 70.516s


| Adam | epoch: 002 | loss: 0.54796 - acc: 0.7203 -- iter: 17920/24500


Training Step: 664  | total loss: 

0.54599

 | time: 70.750s


| Adam | epoch: 002 | loss: 0.54599 - acc: 0.7201 -- iter: 17984/24500


Training Step: 665  | total loss: 

0.56158

 | time: 70.997s


| Adam | epoch: 002 | loss: 0.56158 - acc: 0.7106 -- iter: 18048/24500


Training Step: 666  | total loss: 

0.56016

 | time: 71.241s


| Adam | epoch: 002 | loss: 0.56016 - acc: 0.7130 -- iter: 18112/24500


Training Step: 667  | total loss: 

0.55597

 | time: 71.478s


| Adam | epoch: 002 | loss: 0.55597 - acc: 0.7136 -- iter: 18176/24500


Training Step: 668  | total loss: 

0.55309

 | time: 71.718s


| Adam | epoch: 002 | loss: 0.55309 - acc: 0.7110 -- iter: 18240/24500


Training Step: 669  | total loss: 

0.54661

 | time: 71.967s


| Adam | epoch: 002 | loss: 0.54661 - acc: 0.7180 -- iter: 18304/24500


Training Step: 670  | total loss: 

0.54978

 | time: 72.213s


| Adam | epoch: 002 | loss: 0.54978 - acc: 0.7118 -- iter: 18368/24500


Training Step: 671  | total loss: 

0.54661

 | time: 72.461s


| Adam | epoch: 002 | loss: 0.54661 - acc: 0.7188 -- iter: 18432/24500


Training Step: 672  | total loss: 

0.54789

 | time: 72.708s


| Adam | epoch: 002 | loss: 0.54789 - acc: 0.7203 -- iter: 18496/24500


Training Step: 673  | total loss: 

0.55260

 | time: 72.947s


| Adam | epoch: 002 | loss: 0.55260 - acc: 0.7155 -- iter: 18560/24500


Training Step: 674  | total loss: 

0.54660

 | time: 73.193s


| Adam | epoch: 002 | loss: 0.54660 - acc: 0.7142 -- iter: 18624/24500


Training Step: 675  | total loss: 

0.55919

 | time: 73.436s


| Adam | epoch: 002 | loss: 0.55919 - acc: 0.7069 -- iter: 18688/24500


Training Step: 676  | total loss: 

0.56203

 | time: 73.687s


| Adam | epoch: 002 | loss: 0.56203 - acc: 0.7112 -- iter: 18752/24500


Training Step: 677  | total loss: 

0.55986

 | time: 73.928s


| Adam | epoch: 002 | loss: 0.55986 - acc: 0.7104 -- iter: 18816/24500


Training Step: 678  | total loss: 

0.55929

 | time: 74.169s


| Adam | epoch: 002 | loss: 0.55929 - acc: 0.7144 -- iter: 18880/24500


Training Step: 679  | total loss: 

0.56282

 | time: 74.417s


| Adam | epoch: 002 | loss: 0.56282 - acc: 0.7132 -- iter: 18944/24500


Training Step: 680  | total loss: 

0.56126

 | time: 74.655s


| Adam | epoch: 002 | loss: 0.56126 - acc: 0.7185 -- iter: 19008/24500


Training Step: 681  | total loss: 

0.54944

 | time: 74.888s


| Adam | epoch: 002 | loss: 0.54944 - acc: 0.7279 -- iter: 19072/24500


Training Step: 682  | total loss: 

0.53745

 | time: 75.132s


| Adam | epoch: 002 | loss: 0.53745 - acc: 0.7395 -- iter: 19136/24500


Training Step: 683  | total loss: 

0.53737

 | time: 75.371s


| Adam | epoch: 002 | loss: 0.53737 - acc: 0.7374 -- iter: 19200/24500


Training Step: 684  | total loss: 

0.52868

 | time: 75.608s


| Adam | epoch: 002 | loss: 0.52868 - acc: 0.7527 -- iter: 19264/24500


Training Step: 685  | total loss: 

0.52413

 | time: 75.843s


| Adam | epoch: 002 | loss: 0.52413 - acc: 0.7556 -- iter: 19328/24500


Training Step: 686  | total loss: 

0.52622

 | time: 76.086s


| Adam | epoch: 002 | loss: 0.52622 - acc: 0.7534 -- iter: 19392/24500


Training Step: 687  | total loss: 

0.53992

 | time: 76.333s


| Adam | epoch: 002 | loss: 0.53992 - acc: 0.7437 -- iter: 19456/24500


Training Step: 688  | total loss: 

0.54010

 | time: 76.572s


| Adam | epoch: 002 | loss: 0.54010 - acc: 0.7475 -- iter: 19520/24500


Training Step: 689  | total loss: 

0.52674

 | time: 76.810s


| Adam | epoch: 002 | loss: 0.52674 - acc: 0.7571 -- iter: 19584/24500


Training Step: 690  | total loss: 

0.51744

 | time: 77.049s


| Adam | epoch: 002 | loss: 0.51744 - acc: 0.7564 -- iter: 19648/24500


Training Step: 691  | total loss: 

0.51682

 | time: 77.296s


| Adam | epoch: 002 | loss: 0.51682 - acc: 0.7558 -- iter: 19712/24500


Training Step: 692  | total loss: 

0.51606

 | time: 77.542s


| Adam | epoch: 002 | loss: 0.51606 - acc: 0.7614 -- iter: 19776/24500


Training Step: 693  | total loss: 

0.51129

 | time: 77.779s


| Adam | epoch: 002 | loss: 0.51129 - acc: 0.7665 -- iter: 19840/24500


Training Step: 694  | total loss: 

0.51006

 | time: 78.026s


| Adam | epoch: 002 | loss: 0.51006 - acc: 0.7664 -- iter: 19904/24500


Training Step: 695  | total loss: 

0.51371

 | time: 78.262s


| Adam | epoch: 002 | loss: 0.51371 - acc: 0.7664 -- iter: 19968/24500


Training Step: 696  | total loss: 

0.52209

 | time: 78.501s


| Adam | epoch: 002 | loss: 0.52209 - acc: 0.7522 -- iter: 20032/24500


Training Step: 697  | total loss: 

0.53419

 | time: 78.742s


| Adam | epoch: 002 | loss: 0.53419 - acc: 0.7473 -- iter: 20096/24500


Training Step: 698  | total loss: 

0.52731

 | time: 78.986s


| Adam | epoch: 002 | loss: 0.52731 - acc: 0.7476 -- iter: 20160/24500


Training Step: 699  | total loss: 

0.53167

 | time: 79.220s


| Adam | epoch: 002 | loss: 0.53167 - acc: 0.7447 -- iter: 20224/24500


Training Step: 700  | total loss: 

0.52571

 | time: 79.465s


| Adam | epoch: 002 | loss: 0.52571 - acc: 0.7499 -- iter: 20288/24500


Training Step: 701  | total loss: 

0.54023

 | time: 79.713s


| Adam | epoch: 002 | loss: 0.54023 - acc: 0.7499 -- iter: 20352/24500


Training Step: 702  | total loss: 

0.53889

 | time: 79.953s


| Adam | epoch: 002 | loss: 0.53889 - acc: 0.7452 -- iter: 20416/24500


Training Step: 703  | total loss: 

0.54939

 | time: 80.198s


| Adam | epoch: 002 | loss: 0.54939 - acc: 0.7363 -- iter: 20480/24500


Training Step: 704  | total loss: 

0.55040

 | time: 80.442s


| Adam | epoch: 002 | loss: 0.55040 - acc: 0.7362 -- iter: 20544/24500


Training Step: 705  | total loss: 

0.56452

 | time: 80.684s


| Adam | epoch: 002 | loss: 0.56452 - acc: 0.7250 -- iter: 20608/24500


Training Step: 706  | total loss: 

0.55923

 | time: 80.927s


| Adam | epoch: 002 | loss: 0.55923 - acc: 0.7291 -- iter: 20672/24500


Training Step: 707  | total loss: 

0.57536

 | time: 81.172s


| Adam | epoch: 002 | loss: 0.57536 - acc: 0.7093 -- iter: 20736/24500


Training Step: 708  | total loss: 

0.57940

 | time: 81.411s


| Adam | epoch: 002 | loss: 0.57940 - acc: 0.7071 -- iter: 20800/24500


Training Step: 709  | total loss: 

0.57147

 | time: 81.653s


| Adam | epoch: 002 | loss: 0.57147 - acc: 0.7161 -- iter: 20864/24500


Training Step: 710  | total loss: 

0.56919

 | time: 81.899s


| Adam | epoch: 002 | loss: 0.56919 - acc: 0.7211 -- iter: 20928/24500


Training Step: 711  | total loss: 

0.56912

 | time: 82.140s


| Adam | epoch: 002 | loss: 0.56912 - acc: 0.7146 -- iter: 20992/24500


Training Step: 712  | total loss: 

0.57174

 | time: 82.386s


| Adam | epoch: 002 | loss: 0.57174 - acc: 0.7119 -- iter: 21056/24500


Training Step: 713  | total loss: 

0.56759

 | time: 82.625s


| Adam | epoch: 002 | loss: 0.56759 - acc: 0.7172 -- iter: 21120/24500


Training Step: 714  | total loss: 

0.56599

 | time: 82.876s


| Adam | epoch: 002 | loss: 0.56599 - acc: 0.7111 -- iter: 21184/24500


Training Step: 715  | total loss: 

0.56120

 | time: 83.109s


| Adam | epoch: 002 | loss: 0.56120 - acc: 0.7103 -- iter: 21248/24500


Training Step: 716  | total loss: 

0.55630

 | time: 83.355s


| Adam | epoch: 002 | loss: 0.55630 - acc: 0.7159 -- iter: 21312/24500


Training Step: 717  | total loss: 

0.55257

 | time: 83.604s


| Adam | epoch: 002 | loss: 0.55257 - acc: 0.7240 -- iter: 21376/24500


Training Step: 718  | total loss: 

0.55021

 | time: 83.847s


| Adam | epoch: 002 | loss: 0.55021 - acc: 0.7203 -- iter: 21440/24500


Training Step: 719  | total loss: 

0.54152

 | time: 84.089s


| Adam | epoch: 002 | loss: 0.54152 - acc: 0.7280 -- iter: 21504/24500


Training Step: 720  | total loss: 

0.54391

 | time: 84.335s


| Adam | epoch: 002 | loss: 0.54391 - acc: 0.7302 -- iter: 21568/24500


Training Step: 721  | total loss: 

0.54586

 | time: 84.588s


| Adam | epoch: 002 | loss: 0.54586 - acc: 0.7259 -- iter: 21632/24500


Training Step: 722  | total loss: 

0.53845

 | time: 84.836s


| Adam | epoch: 002 | loss: 0.53845 - acc: 0.7299 -- iter: 21696/24500


Training Step: 723  | total loss: 

0.54157

 | time: 85.081s


| Adam | epoch: 002 | loss: 0.54157 - acc: 0.7319 -- iter: 21760/24500


Training Step: 724  | total loss: 

0.52718

 | time: 85.325s


| Adam | epoch: 002 | loss: 0.52718 - acc: 0.7400 -- iter: 21824/24500


Training Step: 725  | total loss: 

0.53715

 | time: 85.563s


| Adam | epoch: 002 | loss: 0.53715 - acc: 0.7316 -- iter: 21888/24500


Training Step: 726  | total loss: 

0.53265

 | time: 85.805s


| Adam | epoch: 002 | loss: 0.53265 - acc: 0.7381 -- iter: 21952/24500


Training Step: 727  | total loss: 

0.52339

 | time: 86.046s


| Adam | epoch: 002 | loss: 0.52339 - acc: 0.7377 -- iter: 22016/24500


Training Step: 728  | total loss: 

0.53870

 | time: 86.289s


| Adam | epoch: 002 | loss: 0.53870 - acc: 0.7358 -- iter: 22080/24500


Training Step: 729  | total loss: 

0.53929

 | time: 86.542s


| Adam | epoch: 002 | loss: 0.53929 - acc: 0.7404 -- iter: 22144/24500


Training Step: 730  | total loss: 

0.54868

 | time: 86.785s


| Adam | epoch: 002 | loss: 0.54868 - acc: 0.7351 -- iter: 22208/24500


Training Step: 731  | total loss: 

0.55291

 | time: 87.031s


| Adam | epoch: 002 | loss: 0.55291 - acc: 0.7350 -- iter: 22272/24500


Training Step: 732  | total loss: 

0.54921

 | time: 87.272s


| Adam | epoch: 002 | loss: 0.54921 - acc: 0.7412 -- iter: 22336/24500


Training Step: 733  | total loss: 

0.54672

 | time: 87.507s


| Adam | epoch: 002 | loss: 0.54672 - acc: 0.7358 -- iter: 22400/24500


Training Step: 734  | total loss: 

0.55331

 | time: 87.748s


| Adam | epoch: 002 | loss: 0.55331 - acc: 0.7341 -- iter: 22464/24500


Training Step: 735  | total loss: 

0.54437

 | time: 87.990s


| Adam | epoch: 002 | loss: 0.54437 - acc: 0.7404 -- iter: 22528/24500


Training Step: 736  | total loss: 

0.58673

 | time: 88.234s


| Adam | epoch: 002 | loss: 0.58673 - acc: 0.7148 -- iter: 22592/24500


Training Step: 737  | total loss: 

0.57975

 | time: 88.477s


| Adam | epoch: 002 | loss: 0.57975 - acc: 0.7199 -- iter: 22656/24500


Training Step: 738  | total loss: 

0.57795

 | time: 88.711s


| Adam | epoch: 002 | loss: 0.57795 - acc: 0.7182 -- iter: 22720/24500


Training Step: 739  | total loss: 

0.58892

 | time: 88.948s


| Adam | epoch: 002 | loss: 0.58892 - acc: 0.6995 -- iter: 22784/24500


Training Step: 740  | total loss: 

0.58605

 | time: 89.195s


| Adam | epoch: 002 | loss: 0.58605 - acc: 0.7046 -- iter: 22848/24500


Training Step: 741  | total loss: 

0.57698

 | time: 89.444s


| Adam | epoch: 002 | loss: 0.57698 - acc: 0.7185 -- iter: 22912/24500


Training Step: 742  | total loss: 

0.57294

 | time: 89.682s


| Adam | epoch: 002 | loss: 0.57294 - acc: 0.7232 -- iter: 22976/24500


Training Step: 743  | total loss: 

0.57225

 | time: 89.930s


| Adam | epoch: 002 | loss: 0.57225 - acc: 0.7259 -- iter: 23040/24500


Training Step: 744  | total loss: 

0.57204

 | time: 90.175s


| Adam | epoch: 002 | loss: 0.57204 - acc: 0.7236 -- iter: 23104/24500


Training Step: 745  | total loss: 

0.56688

 | time: 90.423s


| Adam | epoch: 002 | loss: 0.56688 - acc: 0.7294 -- iter: 23168/24500


Training Step: 746  | total loss: 

0.56624

 | time: 90.669s


| Adam | epoch: 002 | loss: 0.56624 - acc: 0.7299 -- iter: 23232/24500


Training Step: 747  | total loss: 

0.56164

 | time: 90.904s


| Adam | epoch: 002 | loss: 0.56164 - acc: 0.7334 -- iter: 23296/24500


Training Step: 748  | total loss: 

0.55717

 | time: 91.148s


| Adam | epoch: 002 | loss: 0.55717 - acc: 0.7320 -- iter: 23360/24500


Training Step: 749  | total loss: 

0.54668

 | time: 91.385s


| Adam | epoch: 002 | loss: 0.54668 - acc: 0.7385 -- iter: 23424/24500


Training Step: 750  | total loss: 

0.54411

 | time: 91.635s


| Adam | epoch: 002 | loss: 0.54411 - acc: 0.7396 -- iter: 23488/24500


Training Step: 751  | total loss: 

0.54026

 | time: 91.872s


| Adam | epoch: 002 | loss: 0.54026 - acc: 0.7360 -- iter: 23552/24500


Training Step: 752  | total loss: 

0.53228

 | time: 92.111s


| Adam | epoch: 002 | loss: 0.53228 - acc: 0.7374 -- iter: 23616/24500


Training Step: 753  | total loss: 

0.52835

 | time: 92.364s


| Adam | epoch: 002 | loss: 0.52835 - acc: 0.7449 -- iter: 23680/24500


Training Step: 754  | total loss: 

0.52003

 | time: 92.604s


| Adam | epoch: 002 | loss: 0.52003 - acc: 0.7485 -- iter: 23744/24500


Training Step: 755  | total loss: 

0.54058

 | time: 92.854s


| Adam | epoch: 002 | loss: 0.54058 - acc: 0.7299 -- iter: 23808/24500


Training Step: 756  | total loss: 

0.54416

 | time: 93.099s


| Adam | epoch: 002 | loss: 0.54416 - acc: 0.7335 -- iter: 23872/24500


Training Step: 757  | total loss: 

0.53851

 | time: 93.341s


| Adam | epoch: 002 | loss: 0.53851 - acc: 0.7383 -- iter: 23936/24500


Training Step: 758  | total loss: 

0.53330

 | time: 93.591s


| Adam | epoch: 002 | loss: 0.53330 - acc: 0.7394 -- iter: 24000/24500


Training Step: 759  | total loss: 

0.52987

 | time: 93.833s


| Adam | epoch: 002 | loss: 0.52987 - acc: 0.7374 -- iter: 24064/24500


Training Step: 760  | total loss: 

0.51780

 | time: 94.062s


| Adam | epoch: 002 | loss: 0.51780 - acc: 0.7433 -- iter: 24128/24500


Training Step: 761  | total loss: 

0.51448

 | time: 94.309s


| Adam | epoch: 002 | loss: 0.51448 - acc: 0.7440 -- iter: 24192/24500


Training Step: 762  | total loss: 

0.51614

 | time: 94.554s


| Adam | epoch: 002 | loss: 0.51614 - acc: 0.7462 -- iter: 24256/24500


Training Step: 763  | total loss: 

0.52340

 | time: 94.796s


| Adam | epoch: 002 | loss: 0.52340 - acc: 0.7340 -- iter: 24320/24500


Training Step: 764  | total loss: 

0.51405

 | time: 95.049s


| Adam | epoch: 002 | loss: 0.51405 - acc: 0.7388 -- iter: 24384/24500


Training Step: 765  | total loss: 

0.51945

 | time: 95.297s


| Adam | epoch: 002 | loss: 0.51945 - acc: 0.7352 -- iter: 24448/24500


Training Step: 766  | total loss: 

0.51404

 | time: 96.555s


| Adam | epoch: 002 | loss: 0.51404 - acc: 0.7414 | val_loss: 0.51185 - val_acc: 0.7560 -- iter: 24500/24500
--


Training Step: 767  | total loss: 

0.51055

 | time: 0.200s


| Adam | epoch: 003 | loss: 0.51055 - acc: 0.7422 -- iter: 00064/24500


Training Step: 768  | total loss: 

0.51052

 | time: 0.397s


| Adam | epoch: 003 | loss: 0.51052 - acc: 0.7507 -- iter: 00128/24500


Training Step: 769  | total loss: 

0.50759

 | time: 0.641s


| Adam | epoch: 003 | loss: 0.50759 - acc: 0.7506 -- iter: 00192/24500


Training Step: 770  | total loss: 

0.51979

 | time: 0.878s


| Adam | epoch: 003 | loss: 0.51979 - acc: 0.7459 -- iter: 00256/24500


Training Step: 771  | total loss: 

0.52059

 | time: 1.120s


| Adam | epoch: 003 | loss: 0.52059 - acc: 0.7416 -- iter: 00320/24500


Training Step: 772  | total loss: 

0.52316

 | time: 1.360s


| Adam | epoch: 003 | loss: 0.52316 - acc: 0.7362 -- iter: 00384/24500


Training Step: 773  | total loss: 

0.53215

 | time: 1.610s


| Adam | epoch: 003 | loss: 0.53215 - acc: 0.7298 -- iter: 00448/24500


Training Step: 774  | total loss: 

0.53359

 | time: 1.844s


| Adam | epoch: 003 | loss: 0.53359 - acc: 0.7287 -- iter: 00512/24500


Training Step: 775  | total loss: 

0.52424

 | time: 2.080s


| Adam | epoch: 003 | loss: 0.52424 - acc: 0.7292 -- iter: 00576/24500


Training Step: 776  | total loss: 

0.52542

 | time: 2.329s


| Adam | epoch: 003 | loss: 0.52542 - acc: 0.7282 -- iter: 00640/24500


Training Step: 777  | total loss: 

0.52601

 | time: 2.583s


| Adam | epoch: 003 | loss: 0.52601 - acc: 0.7288 -- iter: 00704/24500


Training Step: 778  | total loss: 

0.52308

 | time: 2.821s


| Adam | epoch: 003 | loss: 0.52308 - acc: 0.7309 -- iter: 00768/24500


Training Step: 779  | total loss: 

0.53135

 | time: 3.067s


| Adam | epoch: 003 | loss: 0.53135 - acc: 0.7235 -- iter: 00832/24500


Training Step: 780  | total loss: 

0.53567

 | time: 3.304s


| Adam | epoch: 003 | loss: 0.53567 - acc: 0.7199 -- iter: 00896/24500


Training Step: 781  | total loss: 

0.53132

 | time: 3.551s


| Adam | epoch: 003 | loss: 0.53132 - acc: 0.7229 -- iter: 00960/24500


Training Step: 782  | total loss: 

0.52817

 | time: 3.794s


| Adam | epoch: 003 | loss: 0.52817 - acc: 0.7318 -- iter: 01024/24500


Training Step: 783  | total loss: 

0.52213

 | time: 4.027s


| Adam | epoch: 003 | loss: 0.52213 - acc: 0.7383 -- iter: 01088/24500


Training Step: 784  | total loss: 

0.51567

 | time: 4.272s


| Adam | epoch: 003 | loss: 0.51567 - acc: 0.7458 -- iter: 01152/24500


Training Step: 785  | total loss: 

0.51899

 | time: 4.513s


| Adam | epoch: 003 | loss: 0.51899 - acc: 0.7384 -- iter: 01216/24500


Training Step: 786  | total loss: 

0.52403

 | time: 4.752s


| Adam | epoch: 003 | loss: 0.52403 - acc: 0.7348 -- iter: 01280/24500


Training Step: 787  | total loss: 

0.52022

 | time: 4.995s


| Adam | epoch: 003 | loss: 0.52022 - acc: 0.7364 -- iter: 01344/24500


Training Step: 788  | total loss: 

0.52735

 | time: 5.247s


| Adam | epoch: 003 | loss: 0.52735 - acc: 0.7315 -- iter: 01408/24500


Training Step: 789  | total loss: 

0.52803

 | time: 5.494s


| Adam | epoch: 003 | loss: 0.52803 - acc: 0.7318 -- iter: 01472/24500


Training Step: 790  | total loss: 

0.53355

 | time: 5.730s


| Adam | epoch: 003 | loss: 0.53355 - acc: 0.7305 -- iter: 01536/24500


Training Step: 791  | total loss: 

0.53370

 | time: 5.970s


| Adam | epoch: 003 | loss: 0.53370 - acc: 0.7340 -- iter: 01600/24500


Training Step: 792  | total loss: 

0.53101

 | time: 6.214s


| Adam | epoch: 003 | loss: 0.53101 - acc: 0.7340 -- iter: 01664/24500


Training Step: 793  | total loss: 

0.51760

 | time: 6.454s


| Adam | epoch: 003 | loss: 0.51760 - acc: 0.7466 -- iter: 01728/24500


Training Step: 794  | total loss: 

0.52660

 | time: 6.698s


| Adam | epoch: 003 | loss: 0.52660 - acc: 0.7438 -- iter: 01792/24500


Training Step: 795  | total loss: 

0.52166

 | time: 6.948s


| Adam | epoch: 003 | loss: 0.52166 - acc: 0.7444 -- iter: 01856/24500


Training Step: 796  | total loss: 

0.52686

 | time: 7.196s


| Adam | epoch: 003 | loss: 0.52686 - acc: 0.7387 -- iter: 01920/24500


Training Step: 797  | total loss: 

0.52981

 | time: 7.441s


| Adam | epoch: 003 | loss: 0.52981 - acc: 0.7398 -- iter: 01984/24500


Training Step: 798  | total loss: 

0.52415

 | time: 7.681s


| Adam | epoch: 003 | loss: 0.52415 - acc: 0.7424 -- iter: 02048/24500


Training Step: 799  | total loss: 

0.52735

 | time: 7.921s


| Adam | epoch: 003 | loss: 0.52735 - acc: 0.7369 -- iter: 02112/24500


Training Step: 800  | total loss: 

0.51923

 | time: 8.162s


| Adam | epoch: 003 | loss: 0.51923 - acc: 0.7460 -- iter: 02176/24500


Training Step: 801  | total loss: 

0.52733

 | time: 8.409s


| Adam | epoch: 003 | loss: 0.52733 - acc: 0.7449 -- iter: 02240/24500


Training Step: 802  | total loss: 

0.52098

 | time: 8.659s


| Adam | epoch: 003 | loss: 0.52098 - acc: 0.7501 -- iter: 02304/24500


Training Step: 803  | total loss: 

0.53710

 | time: 8.889s


| Adam | epoch: 003 | loss: 0.53710 - acc: 0.7344 -- iter: 02368/24500


Training Step: 804  | total loss: 

0.53859

 | time: 9.126s


| Adam | epoch: 003 | loss: 0.53859 - acc: 0.7313 -- iter: 02432/24500


Training Step: 805  | total loss: 

0.53921

 | time: 9.367s


| Adam | epoch: 003 | loss: 0.53921 - acc: 0.7254 -- iter: 02496/24500


Training Step: 806  | total loss: 

0.52960

 | time: 9.620s


| Adam | epoch: 003 | loss: 0.52960 - acc: 0.7310 -- iter: 02560/24500


Training Step: 807  | total loss: 

0.52252

 | time: 9.868s


| Adam | epoch: 003 | loss: 0.52252 - acc: 0.7313 -- iter: 02624/24500


Training Step: 808  | total loss: 

0.52435

 | time: 10.114s


| Adam | epoch: 003 | loss: 0.52435 - acc: 0.7285 -- iter: 02688/24500


Training Step: 809  | total loss: 

0.52177

 | time: 10.359s


| Adam | epoch: 003 | loss: 0.52177 - acc: 0.7259 -- iter: 02752/24500


Training Step: 810  | total loss: 

0.52292

 | time: 10.600s


| Adam | epoch: 003 | loss: 0.52292 - acc: 0.7252 -- iter: 02816/24500


Training Step: 811  | total loss: 

0.52092

 | time: 10.837s


| Adam | epoch: 003 | loss: 0.52092 - acc: 0.7293 -- iter: 02880/24500


Training Step: 812  | total loss: 

0.51570

 | time: 11.083s


| Adam | epoch: 003 | loss: 0.51570 - acc: 0.7329 -- iter: 02944/24500


Training Step: 813  | total loss: 

0.51715

 | time: 11.330s


| Adam | epoch: 003 | loss: 0.51715 - acc: 0.7315 -- iter: 03008/24500


Training Step: 814  | total loss: 

0.52257

 | time: 11.577s


| Adam | epoch: 003 | loss: 0.52257 - acc: 0.7224 -- iter: 03072/24500


Training Step: 815  | total loss: 

0.52040

 | time: 11.817s


| Adam | epoch: 003 | loss: 0.52040 - acc: 0.7252 -- iter: 03136/24500


Training Step: 816  | total loss: 

0.51997

 | time: 12.053s


| Adam | epoch: 003 | loss: 0.51997 - acc: 0.7261 -- iter: 03200/24500


Training Step: 817  | total loss: 

0.51027

 | time: 12.313s


| Adam | epoch: 003 | loss: 0.51027 - acc: 0.7363 -- iter: 03264/24500


Training Step: 818  | total loss: 

0.50533

 | time: 12.562s


| Adam | epoch: 003 | loss: 0.50533 - acc: 0.7408 -- iter: 03328/24500


Training Step: 819  | total loss: 

0.51730

 | time: 12.804s


| Adam | epoch: 003 | loss: 0.51730 - acc: 0.7401 -- iter: 03392/24500


Training Step: 820  | total loss: 

0.51307

 | time: 13.049s


| Adam | epoch: 003 | loss: 0.51307 - acc: 0.7396 -- iter: 03456/24500


Training Step: 821  | total loss: 

0.50914

 | time: 13.289s


| Adam | epoch: 003 | loss: 0.50914 - acc: 0.7469 -- iter: 03520/24500


Training Step: 822  | total loss: 

0.51036

 | time: 13.533s


| Adam | epoch: 003 | loss: 0.51036 - acc: 0.7409 -- iter: 03584/24500


Training Step: 823  | total loss: 

0.50965

 | time: 13.772s


| Adam | epoch: 003 | loss: 0.50965 - acc: 0.7403 -- iter: 03648/24500


Training Step: 824  | total loss: 

0.50489

 | time: 14.016s


| Adam | epoch: 003 | loss: 0.50489 - acc: 0.7444 -- iter: 03712/24500


Training Step: 825  | total loss: 

0.50091

 | time: 14.249s


| Adam | epoch: 003 | loss: 0.50091 - acc: 0.7496 -- iter: 03776/24500


Training Step: 826  | total loss: 

0.50011

 | time: 14.486s


| Adam | epoch: 003 | loss: 0.50011 - acc: 0.7450 -- iter: 03840/24500


Training Step: 827  | total loss: 

0.50443

 | time: 14.719s


| Adam | epoch: 003 | loss: 0.50443 - acc: 0.7392 -- iter: 03904/24500


Training Step: 828  | total loss: 

0.49609

 | time: 14.954s


| Adam | epoch: 003 | loss: 0.49609 - acc: 0.7497 -- iter: 03968/24500


Training Step: 829  | total loss: 

0.50728

 | time: 15.195s


| Adam | epoch: 003 | loss: 0.50728 - acc: 0.7466 -- iter: 04032/24500


Training Step: 830  | total loss: 

0.50012

 | time: 15.434s


| Adam | epoch: 003 | loss: 0.50012 - acc: 0.7516 -- iter: 04096/24500


Training Step: 831  | total loss: 

0.49727

 | time: 15.680s


| Adam | epoch: 003 | loss: 0.49727 - acc: 0.7514 -- iter: 04160/24500


Training Step: 832  | total loss: 

0.50318

 | time: 15.924s


| Adam | epoch: 003 | loss: 0.50318 - acc: 0.7451 -- iter: 04224/24500


Training Step: 833  | total loss: 

0.50551

 | time: 16.173s


| Adam | epoch: 003 | loss: 0.50551 - acc: 0.7440 -- iter: 04288/24500


Training Step: 834  | total loss: 

0.51061

 | time: 16.414s


| Adam | epoch: 003 | loss: 0.51061 - acc: 0.7415 -- iter: 04352/24500


Training Step: 835  | total loss: 

0.50619

 | time: 16.656s


| Adam | epoch: 003 | loss: 0.50619 - acc: 0.7470 -- iter: 04416/24500


Training Step: 836  | total loss: 

0.49209

 | time: 16.898s


| Adam | epoch: 003 | loss: 0.49209 - acc: 0.7551 -- iter: 04480/24500


Training Step: 837  | total loss: 

0.49506

 | time: 17.150s


| Adam | epoch: 003 | loss: 0.49506 - acc: 0.7530 -- iter: 04544/24500


Training Step: 838  | total loss: 

0.50342

 | time: 17.401s


| Adam | epoch: 003 | loss: 0.50342 - acc: 0.7512 -- iter: 04608/24500


Training Step: 839  | total loss: 

0.49617

 | time: 17.654s


| Adam | epoch: 003 | loss: 0.49617 - acc: 0.7573 -- iter: 04672/24500


Training Step: 840  | total loss: 

0.50476

 | time: 17.891s


| Adam | epoch: 003 | loss: 0.50476 - acc: 0.7488 -- iter: 04736/24500


Training Step: 841  | total loss: 

0.51033

 | time: 18.130s


| Adam | epoch: 003 | loss: 0.51033 - acc: 0.7520 -- iter: 04800/24500


Training Step: 842  | total loss: 

0.50998

 | time: 18.374s


| Adam | epoch: 003 | loss: 0.50998 - acc: 0.7518 -- iter: 04864/24500


Training Step: 843  | total loss: 

0.51101

 | time: 18.612s


| Adam | epoch: 003 | loss: 0.51101 - acc: 0.7516 -- iter: 04928/24500


Training Step: 844  | total loss: 

0.50980

 | time: 18.854s


| Adam | epoch: 003 | loss: 0.50980 - acc: 0.7530 -- iter: 04992/24500


Training Step: 845  | total loss: 

0.53124

 | time: 19.098s


| Adam | epoch: 003 | loss: 0.53124 - acc: 0.7340 -- iter: 05056/24500


Training Step: 846  | total loss: 

0.52049

 | time: 19.350s


| Adam | epoch: 003 | loss: 0.52049 - acc: 0.7434 -- iter: 05120/24500


Training Step: 847  | total loss: 

0.52104

 | time: 19.590s


| Adam | epoch: 003 | loss: 0.52104 - acc: 0.7456 -- iter: 05184/24500


Training Step: 848  | total loss: 

0.51482

 | time: 19.836s


| Adam | epoch: 003 | loss: 0.51482 - acc: 0.7445 -- iter: 05248/24500


Training Step: 849  | total loss: 

0.51662

 | time: 20.081s


| Adam | epoch: 003 | loss: 0.51662 - acc: 0.7419 -- iter: 05312/24500


Training Step: 850  | total loss: 

0.52451

 | time: 20.326s


| Adam | epoch: 003 | loss: 0.52451 - acc: 0.7380 -- iter: 05376/24500


Training Step: 851  | total loss: 

0.52402

 | time: 20.560s


| Adam | epoch: 003 | loss: 0.52402 - acc: 0.7408 -- iter: 05440/24500


Training Step: 852  | total loss: 

0.51244

 | time: 20.805s


| Adam | epoch: 003 | loss: 0.51244 - acc: 0.7527 -- iter: 05504/24500


Training Step: 853  | total loss: 

0.51093

 | time: 21.056s


| Adam | epoch: 003 | loss: 0.51093 - acc: 0.7571 -- iter: 05568/24500


Training Step: 854  | total loss: 

0.50323

 | time: 21.307s


| Adam | epoch: 003 | loss: 0.50323 - acc: 0.7626 -- iter: 05632/24500


Training Step: 855  | total loss: 

0.50936

 | time: 21.543s


| Adam | epoch: 003 | loss: 0.50936 - acc: 0.7598 -- iter: 05696/24500


Training Step: 856  | total loss: 

0.49607

 | time: 21.779s


| Adam | epoch: 003 | loss: 0.49607 - acc: 0.7698 -- iter: 05760/24500


Training Step: 857  | total loss: 

0.49658

 | time: 22.026s


| Adam | epoch: 003 | loss: 0.49658 - acc: 0.7678 -- iter: 05824/24500


Training Step: 858  | total loss: 

0.49489

 | time: 22.272s


| Adam | epoch: 003 | loss: 0.49489 - acc: 0.7707 -- iter: 05888/24500


Training Step: 859  | total loss: 

0.50138

 | time: 22.522s


| Adam | epoch: 003 | loss: 0.50138 - acc: 0.7702 -- iter: 05952/24500


Training Step: 860  | total loss: 

0.51077

 | time: 22.773s


| Adam | epoch: 003 | loss: 0.51077 - acc: 0.7604 -- iter: 06016/24500


Training Step: 861  | total loss: 

0.51533

 | time: 23.012s


| Adam | epoch: 003 | loss: 0.51533 - acc: 0.7609 -- iter: 06080/24500


Training Step: 862  | total loss: 

0.51789

 | time: 23.253s


| Adam | epoch: 003 | loss: 0.51789 - acc: 0.7629 -- iter: 06144/24500


Training Step: 863  | total loss: 

0.51340

 | time: 23.504s


| Adam | epoch: 003 | loss: 0.51340 - acc: 0.7632 -- iter: 06208/24500


Training Step: 864  | total loss: 

0.51857

 | time: 23.748s


| Adam | epoch: 003 | loss: 0.51857 - acc: 0.7634 -- iter: 06272/24500


Training Step: 865  | total loss: 

0.51933

 | time: 23.998s


| Adam | epoch: 003 | loss: 0.51933 - acc: 0.7590 -- iter: 06336/24500


Training Step: 866  | total loss: 

0.50723

 | time: 24.232s


| Adam | epoch: 003 | loss: 0.50723 - acc: 0.7659 -- iter: 06400/24500


Training Step: 867  | total loss: 

0.50790

 | time: 24.476s


| Adam | epoch: 003 | loss: 0.50790 - acc: 0.7627 -- iter: 06464/24500


Training Step: 868  | total loss: 

0.51223

 | time: 24.716s


| Adam | epoch: 003 | loss: 0.51223 - acc: 0.7615 -- iter: 06528/24500


Training Step: 869  | total loss: 

0.50918

 | time: 24.953s


| Adam | epoch: 003 | loss: 0.50918 - acc: 0.7572 -- iter: 06592/24500


Training Step: 870  | total loss: 

0.50989

 | time: 25.198s


| Adam | epoch: 003 | loss: 0.50989 - acc: 0.7549 -- iter: 06656/24500


Training Step: 871  | total loss: 

0.51642

 | time: 25.437s


| Adam | epoch: 003 | loss: 0.51642 - acc: 0.7560 -- iter: 06720/24500


Training Step: 872  | total loss: 

0.51476

 | time: 25.683s


| Adam | epoch: 003 | loss: 0.51476 - acc: 0.7601 -- iter: 06784/24500


Training Step: 873  | total loss: 

0.51722

 | time: 25.931s


| Adam | epoch: 003 | loss: 0.51722 - acc: 0.7544 -- iter: 06848/24500


Training Step: 874  | total loss: 

0.50708

 | time: 26.172s


| Adam | epoch: 003 | loss: 0.50708 - acc: 0.7586 -- iter: 06912/24500


Training Step: 875  | total loss: 

0.50625

 | time: 26.421s


| Adam | epoch: 003 | loss: 0.50625 - acc: 0.7593 -- iter: 06976/24500


Training Step: 876  | total loss: 

0.49530

 | time: 26.671s


| Adam | epoch: 003 | loss: 0.49530 - acc: 0.7693 -- iter: 07040/24500


Training Step: 877  | total loss: 

0.50867

 | time: 26.918s


| Adam | epoch: 003 | loss: 0.50867 - acc: 0.7596 -- iter: 07104/24500


Training Step: 878  | total loss: 

0.52046

 | time: 27.165s


| Adam | epoch: 003 | loss: 0.52046 - acc: 0.7492 -- iter: 07168/24500


Training Step: 879  | total loss: 

0.51981

 | time: 27.400s


| Adam | epoch: 003 | loss: 0.51981 - acc: 0.7431 -- iter: 07232/24500


Training Step: 880  | total loss: 

0.52993

 | time: 27.645s


| Adam | epoch: 003 | loss: 0.52993 - acc: 0.7375 -- iter: 07296/24500


Training Step: 881  | total loss: 

0.52921

 | time: 27.882s


| Adam | epoch: 003 | loss: 0.52921 - acc: 0.7372 -- iter: 07360/24500


Training Step: 882  | total loss: 

0.51985

 | time: 28.142s


| Adam | epoch: 003 | loss: 0.51985 - acc: 0.7447 -- iter: 07424/24500


Training Step: 883  | total loss: 

0.51996

 | time: 28.384s


| Adam | epoch: 003 | loss: 0.51996 - acc: 0.7499 -- iter: 07488/24500


Training Step: 884  | total loss: 

0.53039

 | time: 28.618s


| Adam | epoch: 003 | loss: 0.53039 - acc: 0.7437 -- iter: 07552/24500


Training Step: 885  | total loss: 

0.54001

 | time: 28.856s


| Adam | epoch: 003 | loss: 0.54001 - acc: 0.7334 -- iter: 07616/24500


Training Step: 886  | total loss: 

0.54052

 | time: 29.111s


| Adam | epoch: 003 | loss: 0.54052 - acc: 0.7397 -- iter: 07680/24500


Training Step: 887  | total loss: 

0.52951

 | time: 29.353s


| Adam | epoch: 003 | loss: 0.52951 - acc: 0.7455 -- iter: 07744/24500


Training Step: 888  | total loss: 

0.53725

 | time: 29.602s


| Adam | epoch: 003 | loss: 0.53725 - acc: 0.7412 -- iter: 07808/24500


Training Step: 889  | total loss: 

0.52929

 | time: 29.849s


| Adam | epoch: 003 | loss: 0.52929 - acc: 0.7484 -- iter: 07872/24500


Training Step: 890  | total loss: 

0.54028

 | time: 30.099s


| Adam | epoch: 003 | loss: 0.54028 - acc: 0.7423 -- iter: 07936/24500


Training Step: 891  | total loss: 

0.53615

 | time: 30.347s


| Adam | epoch: 003 | loss: 0.53615 - acc: 0.7462 -- iter: 08000/24500


Training Step: 892  | total loss: 

0.52955

 | time: 30.591s


| Adam | epoch: 003 | loss: 0.52955 - acc: 0.7512 -- iter: 08064/24500


Training Step: 893  | total loss: 

0.53327

 | time: 30.837s


| Adam | epoch: 003 | loss: 0.53327 - acc: 0.7511 -- iter: 08128/24500


Training Step: 894  | total loss: 

0.52102

 | time: 31.073s


| Adam | epoch: 003 | loss: 0.52102 - acc: 0.7573 -- iter: 08192/24500


Training Step: 895  | total loss: 

0.51939

 | time: 31.317s


| Adam | epoch: 003 | loss: 0.51939 - acc: 0.7612 -- iter: 08256/24500


Training Step: 896  | total loss: 

0.51210

 | time: 31.564s


| Adam | epoch: 003 | loss: 0.51210 - acc: 0.7648 -- iter: 08320/24500


Training Step: 897  | total loss: 

0.51382

 | time: 31.816s


| Adam | epoch: 003 | loss: 0.51382 - acc: 0.7633 -- iter: 08384/24500


Training Step: 898  | total loss: 

0.51441

 | time: 32.057s


| Adam | epoch: 003 | loss: 0.51441 - acc: 0.7635 -- iter: 08448/24500


Training Step: 899  | total loss: 

0.51287

 | time: 32.292s


| Adam | epoch: 003 | loss: 0.51287 - acc: 0.7637 -- iter: 08512/24500


Training Step: 900  | total loss: 

0.52714

 | time: 32.535s


| Adam | epoch: 003 | loss: 0.52714 - acc: 0.7577 -- iter: 08576/24500


Training Step: 901  | total loss: 

0.50908

 | time: 32.780s


| Adam | epoch: 003 | loss: 0.50908 - acc: 0.7663 -- iter: 08640/24500


Training Step: 902  | total loss: 

0.50564

 | time: 33.027s


| Adam | epoch: 003 | loss: 0.50564 - acc: 0.7600 -- iter: 08704/24500


Training Step: 903  | total loss: 

0.49792

 | time: 33.279s


| Adam | epoch: 003 | loss: 0.49792 - acc: 0.7683 -- iter: 08768/24500


Training Step: 904  | total loss: 

0.51034

 | time: 33.521s


| Adam | epoch: 003 | loss: 0.51034 - acc: 0.7681 -- iter: 08832/24500


Training Step: 905  | total loss: 

0.51810

 | time: 33.760s


| Adam | epoch: 003 | loss: 0.51810 - acc: 0.7663 -- iter: 08896/24500


Training Step: 906  | total loss: 

0.51758

 | time: 33.990s


| Adam | epoch: 003 | loss: 0.51758 - acc: 0.7631 -- iter: 08960/24500


Training Step: 907  | total loss: 

0.50263

 | time: 34.228s


| Adam | epoch: 003 | loss: 0.50263 - acc: 0.7680 -- iter: 09024/24500


Training Step: 908  | total loss: 

0.50720

 | time: 34.468s


| Adam | epoch: 003 | loss: 0.50720 - acc: 0.7584 -- iter: 09088/24500


Training Step: 909  | total loss: 

0.50797

 | time: 34.707s


| Adam | epoch: 003 | loss: 0.50797 - acc: 0.7623 -- iter: 09152/24500


Training Step: 910  | total loss: 

0.51543

 | time: 34.960s


| Adam | epoch: 003 | loss: 0.51543 - acc: 0.7563 -- iter: 09216/24500


Training Step: 911  | total loss: 

0.51106

 | time: 35.196s


| Adam | epoch: 003 | loss: 0.51106 - acc: 0.7604 -- iter: 09280/24500


Training Step: 912  | total loss: 

0.50472

 | time: 35.436s


| Adam | epoch: 003 | loss: 0.50472 - acc: 0.7609 -- iter: 09344/24500


Training Step: 913  | total loss: 

0.50187

 | time: 35.671s


| Adam | epoch: 003 | loss: 0.50187 - acc: 0.7583 -- iter: 09408/24500


Training Step: 914  | total loss: 

0.49934

 | time: 35.905s


| Adam | epoch: 003 | loss: 0.49934 - acc: 0.7621 -- iter: 09472/24500


Training Step: 915  | total loss: 

0.48926

 | time: 36.153s


| Adam | epoch: 003 | loss: 0.48926 - acc: 0.7687 -- iter: 09536/24500


Training Step: 916  | total loss: 

0.49568

 | time: 36.408s


| Adam | epoch: 003 | loss: 0.49568 - acc: 0.7684 -- iter: 09600/24500


Training Step: 917  | total loss: 

0.49960

 | time: 36.648s


| Adam | epoch: 003 | loss: 0.49960 - acc: 0.7681 -- iter: 09664/24500


Training Step: 918  | total loss: 

0.49149

 | time: 36.901s


| Adam | epoch: 003 | loss: 0.49149 - acc: 0.7694 -- iter: 09728/24500


Training Step: 919  | total loss: 

0.50511

 | time: 37.139s


| Adam | epoch: 003 | loss: 0.50511 - acc: 0.7597 -- iter: 09792/24500


Training Step: 920  | total loss: 

0.50568

 | time: 37.381s


| Adam | epoch: 003 | loss: 0.50568 - acc: 0.7587 -- iter: 09856/24500


Training Step: 921  | total loss: 

0.49731

 | time: 37.626s


| Adam | epoch: 003 | loss: 0.49731 - acc: 0.7657 -- iter: 09920/24500


Training Step: 922  | total loss: 

0.49322

 | time: 37.869s


| Adam | epoch: 003 | loss: 0.49322 - acc: 0.7703 -- iter: 09984/24500


Training Step: 923  | total loss: 

0.49103

 | time: 38.122s


| Adam | epoch: 003 | loss: 0.49103 - acc: 0.7714 -- iter: 10048/24500


Training Step: 924  | total loss: 

0.50075

 | time: 38.360s


| Adam | epoch: 003 | loss: 0.50075 - acc: 0.7615 -- iter: 10112/24500


Training Step: 925  | total loss: 

0.49656

 | time: 38.604s


| Adam | epoch: 003 | loss: 0.49656 - acc: 0.7635 -- iter: 10176/24500


Training Step: 926  | total loss: 

0.50239

 | time: 38.851s


| Adam | epoch: 003 | loss: 0.50239 - acc: 0.7621 -- iter: 10240/24500


Training Step: 927  | total loss: 

0.50769

 | time: 39.098s


| Adam | epoch: 003 | loss: 0.50769 - acc: 0.7578 -- iter: 10304/24500


Training Step: 928  | total loss: 

0.50009

 | time: 39.341s


| Adam | epoch: 003 | loss: 0.50009 - acc: 0.7648 -- iter: 10368/24500


Training Step: 929  | total loss: 

0.50428

 | time: 39.580s


| Adam | epoch: 003 | loss: 0.50428 - acc: 0.7649 -- iter: 10432/24500


Training Step: 930  | total loss: 

0.50818

 | time: 39.824s


| Adam | epoch: 003 | loss: 0.50818 - acc: 0.7618 -- iter: 10496/24500


Training Step: 931  | total loss: 

0.51000

 | time: 40.075s


| Adam | epoch: 003 | loss: 0.51000 - acc: 0.7591 -- iter: 10560/24500


Training Step: 932  | total loss: 

0.50504

 | time: 40.320s


| Adam | epoch: 003 | loss: 0.50504 - acc: 0.7597 -- iter: 10624/24500


Training Step: 933  | total loss: 

0.50764

 | time: 40.556s


| Adam | epoch: 003 | loss: 0.50764 - acc: 0.7556 -- iter: 10688/24500


Training Step: 934  | total loss: 

0.50037

 | time: 40.811s


| Adam | epoch: 003 | loss: 0.50037 - acc: 0.7613 -- iter: 10752/24500


Training Step: 935  | total loss: 

0.50260

 | time: 41.048s


| Adam | epoch: 003 | loss: 0.50260 - acc: 0.7539 -- iter: 10816/24500


Training Step: 936  | total loss: 

0.49775

 | time: 41.291s


| Adam | epoch: 003 | loss: 0.49775 - acc: 0.7536 -- iter: 10880/24500


Training Step: 937  | total loss: 

0.50194

 | time: 41.541s


| Adam | epoch: 003 | loss: 0.50194 - acc: 0.7469 -- iter: 10944/24500


Training Step: 938  | total loss: 

0.50883

 | time: 41.783s


| Adam | epoch: 003 | loss: 0.50883 - acc: 0.7426 -- iter: 11008/24500


Training Step: 939  | total loss: 

0.52161

 | time: 42.026s


| Adam | epoch: 003 | loss: 0.52161 - acc: 0.7324 -- iter: 11072/24500


Training Step: 940  | total loss: 

0.51568

 | time: 42.276s


| Adam | epoch: 003 | loss: 0.51568 - acc: 0.7357 -- iter: 11136/24500


Training Step: 941  | total loss: 

0.52825

 | time: 42.520s


| Adam | epoch: 003 | loss: 0.52825 - acc: 0.7293 -- iter: 11200/24500


Training Step: 942  | total loss: 

0.52165

 | time: 42.758s


| Adam | epoch: 003 | loss: 0.52165 - acc: 0.7361 -- iter: 11264/24500


Training Step: 943  | total loss: 

0.51922

 | time: 42.993s


| Adam | epoch: 003 | loss: 0.51922 - acc: 0.7343 -- iter: 11328/24500


Training Step: 944  | total loss: 

0.51459

 | time: 43.231s


| Adam | epoch: 003 | loss: 0.51459 - acc: 0.7422 -- iter: 11392/24500


Training Step: 945  | total loss: 

0.50962

 | time: 43.472s


| Adam | epoch: 003 | loss: 0.50962 - acc: 0.7492 -- iter: 11456/24500


Training Step: 946  | total loss: 

0.50880

 | time: 43.719s


| Adam | epoch: 003 | loss: 0.50880 - acc: 0.7508 -- iter: 11520/24500


Training Step: 947  | total loss: 

0.49905

 | time: 43.967s


| Adam | epoch: 003 | loss: 0.49905 - acc: 0.7570 -- iter: 11584/24500


Training Step: 948  | total loss: 

0.50462

 | time: 44.214s


| Adam | epoch: 003 | loss: 0.50462 - acc: 0.7500 -- iter: 11648/24500


Training Step: 949  | total loss: 

0.49247

 | time: 44.453s


| Adam | epoch: 003 | loss: 0.49247 - acc: 0.7594 -- iter: 11712/24500


Training Step: 950  | total loss: 

0.49544

 | time: 44.692s


| Adam | epoch: 003 | loss: 0.49544 - acc: 0.7569 -- iter: 11776/24500


Training Step: 951  | total loss: 

0.50481

 | time: 44.935s


| Adam | epoch: 003 | loss: 0.50481 - acc: 0.7531 -- iter: 11840/24500


Training Step: 952  | total loss: 

0.51330

 | time: 45.174s


| Adam | epoch: 003 | loss: 0.51330 - acc: 0.7465 -- iter: 11904/24500


Training Step: 953  | total loss: 

0.51646

 | time: 45.423s


| Adam | epoch: 003 | loss: 0.51646 - acc: 0.7469 -- iter: 11968/24500


Training Step: 954  | total loss: 

0.51503

 | time: 45.664s


| Adam | epoch: 003 | loss: 0.51503 - acc: 0.7425 -- iter: 12032/24500


Training Step: 955  | total loss: 

0.52567

 | time: 45.909s


| Adam | epoch: 003 | loss: 0.52567 - acc: 0.7401 -- iter: 12096/24500


Training Step: 956  | total loss: 

0.51382

 | time: 46.149s


| Adam | epoch: 003 | loss: 0.51382 - acc: 0.7427 -- iter: 12160/24500


Training Step: 957  | total loss: 

0.51100

 | time: 46.396s


| Adam | epoch: 003 | loss: 0.51100 - acc: 0.7481 -- iter: 12224/24500


Training Step: 958  | total loss: 

0.51591

 | time: 46.641s


| Adam | epoch: 003 | loss: 0.51591 - acc: 0.7436 -- iter: 12288/24500


Training Step: 959  | total loss: 

0.52049

 | time: 46.875s


| Adam | epoch: 003 | loss: 0.52049 - acc: 0.7396 -- iter: 12352/24500


Training Step: 960  | total loss: 

0.50457

 | time: 47.115s


| Adam | epoch: 003 | loss: 0.50457 - acc: 0.7484 -- iter: 12416/24500


Training Step: 961  | total loss: 

0.49830

 | time: 47.363s


| Adam | epoch: 003 | loss: 0.49830 - acc: 0.7501 -- iter: 12480/24500


Training Step: 962  | total loss: 

0.50506

 | time: 47.607s


| Adam | epoch: 003 | loss: 0.50506 - acc: 0.7439 -- iter: 12544/24500


Training Step: 963  | total loss: 

0.50946

 | time: 47.853s


| Adam | epoch: 003 | loss: 0.50946 - acc: 0.7460 -- iter: 12608/24500


Training Step: 964  | total loss: 

0.51865

 | time: 48.096s


| Adam | epoch: 003 | loss: 0.51865 - acc: 0.7386 -- iter: 12672/24500


Training Step: 965  | total loss: 

0.52115

 | time: 48.320s


| Adam | epoch: 003 | loss: 0.52115 - acc: 0.7398 -- iter: 12736/24500


Training Step: 966  | total loss: 

0.52231

 | time: 48.569s


| Adam | epoch: 003 | loss: 0.52231 - acc: 0.7392 -- iter: 12800/24500


Training Step: 967  | total loss: 

0.51078

 | time: 48.814s


| Adam | epoch: 003 | loss: 0.51078 - acc: 0.7544 -- iter: 12864/24500


Training Step: 968  | total loss: 

0.51689

 | time: 49.057s


| Adam | epoch: 003 | loss: 0.51689 - acc: 0.7539 -- iter: 12928/24500


Training Step: 969  | total loss: 

0.51570

 | time: 49.292s


| Adam | epoch: 003 | loss: 0.51570 - acc: 0.7535 -- iter: 12992/24500


Training Step: 970  | total loss: 

0.51258

 | time: 49.536s


| Adam | epoch: 003 | loss: 0.51258 - acc: 0.7547 -- iter: 13056/24500


Training Step: 971  | total loss: 

0.50981

 | time: 49.788s


| Adam | epoch: 003 | loss: 0.50981 - acc: 0.7590 -- iter: 13120/24500


Training Step: 972  | total loss: 

0.50696

 | time: 50.046s


| Adam | epoch: 003 | loss: 0.50696 - acc: 0.7612 -- iter: 13184/24500


Training Step: 973  | total loss: 

0.50314

 | time: 50.294s


| Adam | epoch: 003 | loss: 0.50314 - acc: 0.7648 -- iter: 13248/24500


Training Step: 974  | total loss: 

0.50158

 | time: 50.545s


| Adam | epoch: 003 | loss: 0.50158 - acc: 0.7648 -- iter: 13312/24500


Training Step: 975  | total loss: 

0.49800

 | time: 50.782s


| Adam | epoch: 003 | loss: 0.49800 - acc: 0.7680 -- iter: 13376/24500


Training Step: 976  | total loss: 

0.49201

 | time: 51.030s


| Adam | epoch: 003 | loss: 0.49201 - acc: 0.7647 -- iter: 13440/24500


Training Step: 977  | total loss: 

0.48282

 | time: 51.272s


| Adam | epoch: 003 | loss: 0.48282 - acc: 0.7741 -- iter: 13504/24500


Training Step: 978  | total loss: 

0.49185

 | time: 51.517s


| Adam | epoch: 003 | loss: 0.49185 - acc: 0.7686 -- iter: 13568/24500


Training Step: 979  | total loss: 

0.49311

 | time: 51.748s


| Adam | epoch: 003 | loss: 0.49311 - acc: 0.7699 -- iter: 13632/24500


Training Step: 980  | total loss: 

0.50291

 | time: 51.984s


| Adam | epoch: 003 | loss: 0.50291 - acc: 0.7663 -- iter: 13696/24500


Training Step: 981  | total loss: 

0.50264

 | time: 52.228s


| Adam | epoch: 003 | loss: 0.50264 - acc: 0.7694 -- iter: 13760/24500


Training Step: 982  | total loss: 

0.50153

 | time: 52.468s


| Adam | epoch: 003 | loss: 0.50153 - acc: 0.7674 -- iter: 13824/24500


Training Step: 983  | total loss: 

0.50290

 | time: 52.715s


| Adam | epoch: 003 | loss: 0.50290 - acc: 0.7704 -- iter: 13888/24500


Training Step: 984  | total loss: 

0.48482

 | time: 52.964s


| Adam | epoch: 003 | loss: 0.48482 - acc: 0.7808 -- iter: 13952/24500


Training Step: 985  | total loss: 

0.47631

 | time: 53.208s


| Adam | epoch: 003 | loss: 0.47631 - acc: 0.7871 -- iter: 14016/24500


Training Step: 986  | total loss: 

0.47490

 | time: 53.451s


| Adam | epoch: 003 | loss: 0.47490 - acc: 0.7865 -- iter: 14080/24500


Training Step: 987  | total loss: 

0.48330

 | time: 53.697s


| Adam | epoch: 003 | loss: 0.48330 - acc: 0.7751 -- iter: 14144/24500


Training Step: 988  | total loss: 

0.50068

 | time: 53.946s


| Adam | epoch: 003 | loss: 0.50068 - acc: 0.7663 -- iter: 14208/24500


Training Step: 989  | total loss: 

0.50908

 | time: 54.195s


| Adam | epoch: 003 | loss: 0.50908 - acc: 0.7631 -- iter: 14272/24500


Training Step: 990  | total loss: 

0.51449

 | time: 54.432s


| Adam | epoch: 003 | loss: 0.51449 - acc: 0.7618 -- iter: 14336/24500


Training Step: 991  | total loss: 

0.51419

 | time: 54.673s


| Adam | epoch: 003 | loss: 0.51419 - acc: 0.7591 -- iter: 14400/24500


Training Step: 992  | total loss: 

0.50750

 | time: 54.926s


| Adam | epoch: 003 | loss: 0.50750 - acc: 0.7644 -- iter: 14464/24500


Training Step: 993  | total loss: 

0.50515

 | time: 55.171s


| Adam | epoch: 003 | loss: 0.50515 - acc: 0.7677 -- iter: 14528/24500


Training Step: 994  | total loss: 

0.51944

 | time: 55.418s


| Adam | epoch: 003 | loss: 0.51944 - acc: 0.7612 -- iter: 14592/24500


Training Step: 995  | total loss: 

0.53611

 | time: 55.658s


| Adam | epoch: 003 | loss: 0.53611 - acc: 0.7523 -- iter: 14656/24500


Training Step: 996  | total loss: 

0.53366

 | time: 55.905s


| Adam | epoch: 003 | loss: 0.53366 - acc: 0.7567 -- iter: 14720/24500


Training Step: 997  | total loss: 

0.53798

 | time: 56.150s


| Adam | epoch: 003 | loss: 0.53798 - acc: 0.7514 -- iter: 14784/24500


Training Step: 998  | total loss: 

0.54644

 | time: 56.390s


| Adam | epoch: 003 | loss: 0.54644 - acc: 0.7465 -- iter: 14848/24500


Training Step: 999  | total loss: 

0.54254

 | time: 56.636s


| Adam | epoch: 003 | loss: 0.54254 - acc: 0.7485 -- iter: 14912/24500


Training Step: 1000  | total loss: 

0.54400

 | time: 57.887s


| Adam | epoch: 003 | loss: 0.54400 - acc: 0.7377 | val_loss: 0.54847 - val_acc: 0.7400 -- iter: 14976/24500
--


Training Step: 1001  | total loss: 

0.54507

 | time: 58.134s


| Adam | epoch: 003 | loss: 0.54507 - acc: 0.7358 -- iter: 15040/24500


Training Step: 1002  | total loss: 

0.53942

 | time: 58.381s


| Adam | epoch: 003 | loss: 0.53942 - acc: 0.7372 -- iter: 15104/24500


Training Step: 1003  | total loss: 

0.53367

 | time: 58.625s


| Adam | epoch: 003 | loss: 0.53367 - acc: 0.7432 -- iter: 15168/24500


Training Step: 1004  | total loss: 

0.53639

 | time: 58.864s


| Adam | epoch: 003 | loss: 0.53639 - acc: 0.7470 -- iter: 15232/24500


Training Step: 1005  | total loss: 

0.54114

 | time: 59.111s


| Adam | epoch: 003 | loss: 0.54114 - acc: 0.7332 -- iter: 15296/24500


Training Step: 1006  | total loss: 

0.53988

 | time: 59.352s


| Adam | epoch: 003 | loss: 0.53988 - acc: 0.7333 -- iter: 15360/24500


Training Step: 1007  | total loss: 

0.53403

 | time: 59.588s


| Adam | epoch: 003 | loss: 0.53403 - acc: 0.7319 -- iter: 15424/24500


Training Step: 1008  | total loss: 

0.53505

 | time: 59.841s


| Adam | epoch: 003 | loss: 0.53505 - acc: 0.7337 -- iter: 15488/24500


Training Step: 1009  | total loss: 

0.53788

 | time: 60.083s


| Adam | epoch: 003 | loss: 0.53788 - acc: 0.7291 -- iter: 15552/24500


Training Step: 1010  | total loss: 

0.53745

 | time: 60.317s


| Adam | epoch: 003 | loss: 0.53745 - acc: 0.7343 -- iter: 15616/24500


Training Step: 1011  | total loss: 

0.54078

 | time: 60.562s


| Adam | epoch: 003 | loss: 0.54078 - acc: 0.7327 -- iter: 15680/24500


Training Step: 1012  | total loss: 

0.54198

 | time: 60.803s


| Adam | epoch: 003 | loss: 0.54198 - acc: 0.7313 -- iter: 15744/24500


Training Step: 1013  | total loss: 

0.54095

 | time: 61.055s


| Adam | epoch: 003 | loss: 0.54095 - acc: 0.7332 -- iter: 15808/24500


Training Step: 1014  | total loss: 

0.54253

 | time: 61.299s


| Adam | epoch: 003 | loss: 0.54253 - acc: 0.7318 -- iter: 15872/24500


Training Step: 1015  | total loss: 

0.53684

 | time: 61.552s


| Adam | epoch: 003 | loss: 0.53684 - acc: 0.7351 -- iter: 15936/24500


Training Step: 1016  | total loss: 

0.53747

 | time: 61.798s


| Adam | epoch: 003 | loss: 0.53747 - acc: 0.7366 -- iter: 16000/24500


Training Step: 1017  | total loss: 

0.53765

 | time: 62.054s


| Adam | epoch: 003 | loss: 0.53765 - acc: 0.7348 -- iter: 16064/24500


Training Step: 1018  | total loss: 

0.53496

 | time: 62.287s


| Adam | epoch: 003 | loss: 0.53496 - acc: 0.7332 -- iter: 16128/24500


Training Step: 1019  | total loss: 

0.52779

 | time: 62.533s


| Adam | epoch: 003 | loss: 0.52779 - acc: 0.7427 -- iter: 16192/24500


Training Step: 1020  | total loss: 

0.52059

 | time: 62.785s


| Adam | epoch: 003 | loss: 0.52059 - acc: 0.7497 -- iter: 16256/24500


Training Step: 1021  | total loss: 

0.51359

 | time: 63.041s


| Adam | epoch: 003 | loss: 0.51359 - acc: 0.7497 -- iter: 16320/24500


Training Step: 1022  | total loss: 

0.51120

 | time: 63.293s


| Adam | epoch: 003 | loss: 0.51120 - acc: 0.7513 -- iter: 16384/24500


Training Step: 1023  | total loss: 

0.50616

 | time: 63.538s


| Adam | epoch: 003 | loss: 0.50616 - acc: 0.7527 -- iter: 16448/24500


Training Step: 1024  | total loss: 

0.50592

 | time: 63.784s


| Adam | epoch: 003 | loss: 0.50592 - acc: 0.7509 -- iter: 16512/24500


Training Step: 1025  | total loss: 

0.49460

 | time: 64.027s


| Adam | epoch: 003 | loss: 0.49460 - acc: 0.7555 -- iter: 16576/24500


Training Step: 1026  | total loss: 

0.50416

 | time: 64.270s


| Adam | epoch: 003 | loss: 0.50416 - acc: 0.7518 -- iter: 16640/24500


Training Step: 1027  | total loss: 

0.50504

 | time: 64.519s


| Adam | epoch: 003 | loss: 0.50504 - acc: 0.7501 -- iter: 16704/24500


Training Step: 1028  | total loss: 

0.50028

 | time: 64.768s


| Adam | epoch: 003 | loss: 0.50028 - acc: 0.7548 -- iter: 16768/24500


Training Step: 1029  | total loss: 

0.49776

 | time: 65.019s


| Adam | epoch: 003 | loss: 0.49776 - acc: 0.7574 -- iter: 16832/24500


Training Step: 1030  | total loss: 

0.51733

 | time: 65.258s


| Adam | epoch: 003 | loss: 0.51733 - acc: 0.7473 -- iter: 16896/24500


Training Step: 1031  | total loss: 

0.50926

 | time: 65.512s


| Adam | epoch: 003 | loss: 0.50926 - acc: 0.7491 -- iter: 16960/24500


Training Step: 1032  | total loss: 

0.51099

 | time: 65.752s


| Adam | epoch: 003 | loss: 0.51099 - acc: 0.7523 -- iter: 17024/24500


Training Step: 1033  | total loss: 

0.52764

 | time: 66.002s


| Adam | epoch: 003 | loss: 0.52764 - acc: 0.7474 -- iter: 17088/24500


Training Step: 1034  | total loss: 

0.54177

 | time: 66.252s


| Adam | epoch: 003 | loss: 0.54177 - acc: 0.7367 -- iter: 17152/24500


Training Step: 1035  | total loss: 

0.53970

 | time: 66.493s


| Adam | epoch: 003 | loss: 0.53970 - acc: 0.7365 -- iter: 17216/24500


Training Step: 1036  | total loss: 

0.53089

 | time: 66.741s


| Adam | epoch: 003 | loss: 0.53089 - acc: 0.7394 -- iter: 17280/24500


Training Step: 1037  | total loss: 

0.52132

 | time: 66.993s


| Adam | epoch: 003 | loss: 0.52132 - acc: 0.7483 -- iter: 17344/24500


Training Step: 1038  | total loss: 

0.51451

 | time: 67.237s


| Adam | epoch: 003 | loss: 0.51451 - acc: 0.7563 -- iter: 17408/24500


Training Step: 1039  | total loss: 

0.50526

 | time: 67.474s


| Adam | epoch: 003 | loss: 0.50526 - acc: 0.7666 -- iter: 17472/24500


Training Step: 1040  | total loss: 

0.50575

 | time: 67.713s


| Adam | epoch: 003 | loss: 0.50575 - acc: 0.7696 -- iter: 17536/24500


Training Step: 1041  | total loss: 

0.51803

 | time: 67.961s


| Adam | epoch: 003 | loss: 0.51803 - acc: 0.7630 -- iter: 17600/24500


Training Step: 1042  | total loss: 

0.52624

 | time: 68.221s


| Adam | epoch: 003 | loss: 0.52624 - acc: 0.7554 -- iter: 17664/24500


Training Step: 1043  | total loss: 

0.52599

 | time: 68.463s


| Adam | epoch: 003 | loss: 0.52599 - acc: 0.7627 -- iter: 17728/24500


Training Step: 1044  | total loss: 

0.51846

 | time: 68.704s


| Adam | epoch: 003 | loss: 0.51846 - acc: 0.7630 -- iter: 17792/24500


Training Step: 1045  | total loss: 

0.51513

 | time: 68.962s


| Adam | epoch: 003 | loss: 0.51513 - acc: 0.7648 -- iter: 17856/24500


Training Step: 1046  | total loss: 

0.52936

 | time: 69.209s


| Adam | epoch: 003 | loss: 0.52936 - acc: 0.7555 -- iter: 17920/24500


Training Step: 1047  | total loss: 

0.53606

 | time: 69.454s


| Adam | epoch: 003 | loss: 0.53606 - acc: 0.7534 -- iter: 17984/24500


Training Step: 1048  | total loss: 

0.52536

 | time: 69.690s


| Adam | epoch: 003 | loss: 0.52536 - acc: 0.7609 -- iter: 18048/24500


Training Step: 1049  | total loss: 

0.51856

 | time: 69.934s


| Adam | epoch: 003 | loss: 0.51856 - acc: 0.7676 -- iter: 18112/24500


Training Step: 1050  | total loss: 

0.52162

 | time: 70.178s


| Adam | epoch: 003 | loss: 0.52162 - acc: 0.7627 -- iter: 18176/24500


Training Step: 1051  | total loss: 

0.51888

 | time: 70.429s


| Adam | epoch: 003 | loss: 0.51888 - acc: 0.7630 -- iter: 18240/24500


Training Step: 1052  | total loss: 

0.51233

 | time: 70.667s


| Adam | epoch: 003 | loss: 0.51233 - acc: 0.7695 -- iter: 18304/24500


Training Step: 1053  | total loss: 

0.50687

 | time: 70.905s


| Adam | epoch: 003 | loss: 0.50687 - acc: 0.7707 -- iter: 18368/24500


Training Step: 1054  | total loss: 

0.51068

 | time: 71.143s


| Adam | epoch: 003 | loss: 0.51068 - acc: 0.7686 -- iter: 18432/24500


Training Step: 1055  | total loss: 

0.51221

 | time: 71.387s


| Adam | epoch: 003 | loss: 0.51221 - acc: 0.7589 -- iter: 18496/24500


Training Step: 1056  | total loss: 

0.50849

 | time: 71.637s


| Adam | epoch: 003 | loss: 0.50849 - acc: 0.7534 -- iter: 18560/24500


Training Step: 1057  | total loss: 

0.49849

 | time: 71.879s


| Adam | epoch: 003 | loss: 0.49849 - acc: 0.7608 -- iter: 18624/24500


Training Step: 1058  | total loss: 

0.48290

 | time: 72.130s


| Adam | epoch: 003 | loss: 0.48290 - acc: 0.7707 -- iter: 18688/24500


Training Step: 1059  | total loss: 

0.49214

 | time: 72.382s


| Adam | epoch: 003 | loss: 0.49214 - acc: 0.7702 -- iter: 18752/24500


Training Step: 1060  | total loss: 

0.48883

 | time: 72.627s


| Adam | epoch: 003 | loss: 0.48883 - acc: 0.7697 -- iter: 18816/24500


Training Step: 1061  | total loss: 

0.50018

 | time: 72.869s


| Adam | epoch: 003 | loss: 0.50018 - acc: 0.7599 -- iter: 18880/24500


Training Step: 1062  | total loss: 

0.49762

 | time: 73.119s


| Adam | epoch: 003 | loss: 0.49762 - acc: 0.7621 -- iter: 18944/24500


Training Step: 1063  | total loss: 

0.49853

 | time: 73.369s


| Adam | epoch: 003 | loss: 0.49853 - acc: 0.7577 -- iter: 19008/24500


Training Step: 1064  | total loss: 

0.50258

 | time: 73.607s


| Adam | epoch: 003 | loss: 0.50258 - acc: 0.7507 -- iter: 19072/24500


Training Step: 1065  | total loss: 

0.50287

 | time: 73.853s


| Adam | epoch: 003 | loss: 0.50287 - acc: 0.7538 -- iter: 19136/24500


Training Step: 1066  | total loss: 

0.49478

 | time: 74.094s


| Adam | epoch: 003 | loss: 0.49478 - acc: 0.7565 -- iter: 19200/24500


Training Step: 1067  | total loss: 

0.49503

 | time: 74.345s


| Adam | epoch: 003 | loss: 0.49503 - acc: 0.7481 -- iter: 19264/24500


Training Step: 1068  | total loss: 

0.49794

 | time: 74.587s


| Adam | epoch: 003 | loss: 0.49794 - acc: 0.7420 -- iter: 19328/24500


Training Step: 1069  | total loss: 

0.48969

 | time: 74.831s


| Adam | epoch: 003 | loss: 0.48969 - acc: 0.7475 -- iter: 19392/24500


Training Step: 1070  | total loss: 

0.48847

 | time: 75.077s


| Adam | epoch: 003 | loss: 0.48847 - acc: 0.7446 -- iter: 19456/24500


Training Step: 1071  | total loss: 

0.48884

 | time: 75.312s


| Adam | epoch: 003 | loss: 0.48884 - acc: 0.7436 -- iter: 19520/24500


Training Step: 1072  | total loss: 

0.48741

 | time: 75.553s


| Adam | epoch: 003 | loss: 0.48741 - acc: 0.7489 -- iter: 19584/24500


Training Step: 1073  | total loss: 

0.48725

 | time: 75.787s


| Adam | epoch: 003 | loss: 0.48725 - acc: 0.7459 -- iter: 19648/24500


Training Step: 1074  | total loss: 

0.48552

 | time: 76.031s


| Adam | epoch: 003 | loss: 0.48552 - acc: 0.7526 -- iter: 19712/24500


Training Step: 1075  | total loss: 

0.48566

 | time: 76.277s


| Adam | epoch: 003 | loss: 0.48566 - acc: 0.7492 -- iter: 19776/24500


Training Step: 1076  | total loss: 

0.49796

 | time: 76.530s


| Adam | epoch: 003 | loss: 0.49796 - acc: 0.7461 -- iter: 19840/24500


Training Step: 1077  | total loss: 

0.49534

 | time: 76.782s


| Adam | epoch: 003 | loss: 0.49534 - acc: 0.7512 -- iter: 19904/24500


Training Step: 1078  | total loss: 

0.48811

 | time: 77.029s


| Adam | epoch: 003 | loss: 0.48811 - acc: 0.7605 -- iter: 19968/24500


Training Step: 1079  | total loss: 

0.49352

 | time: 77.267s


| Adam | epoch: 003 | loss: 0.49352 - acc: 0.7610 -- iter: 20032/24500


Training Step: 1080  | total loss: 

0.48854

 | time: 77.516s


| Adam | epoch: 003 | loss: 0.48854 - acc: 0.7630 -- iter: 20096/24500


Training Step: 1081  | total loss: 

0.48369

 | time: 77.767s


| Adam | epoch: 003 | loss: 0.48369 - acc: 0.7695 -- iter: 20160/24500


Training Step: 1082  | total loss: 

0.47446

 | time: 78.015s


| Adam | epoch: 003 | loss: 0.47446 - acc: 0.7707 -- iter: 20224/24500


Training Step: 1083  | total loss: 

0.46599

 | time: 78.252s


| Adam | epoch: 003 | loss: 0.46599 - acc: 0.7796 -- iter: 20288/24500


Training Step: 1084  | total loss: 

0.49265

 | time: 78.510s


| Adam | epoch: 003 | loss: 0.49265 - acc: 0.7704 -- iter: 20352/24500


Training Step: 1085  | total loss: 

0.49330

 | time: 78.755s


| Adam | epoch: 003 | loss: 0.49330 - acc: 0.7761 -- iter: 20416/24500


Training Step: 1086  | total loss: 

0.48916

 | time: 79.001s


| Adam | epoch: 003 | loss: 0.48916 - acc: 0.7782 -- iter: 20480/24500


Training Step: 1087  | total loss: 

0.48027

 | time: 79.241s


| Adam | epoch: 003 | loss: 0.48027 - acc: 0.7832 -- iter: 20544/24500


Training Step: 1088  | total loss: 

0.47835

 | time: 79.489s


| Adam | epoch: 003 | loss: 0.47835 - acc: 0.7783 -- iter: 20608/24500


Training Step: 1089  | total loss: 

0.48095

 | time: 79.724s


| Adam | epoch: 003 | loss: 0.48095 - acc: 0.7755 -- iter: 20672/24500


Training Step: 1090  | total loss: 

0.47821

 | time: 79.975s


| Adam | epoch: 003 | loss: 0.47821 - acc: 0.7776 -- iter: 20736/24500


Training Step: 1091  | total loss: 

0.48460

 | time: 80.217s


| Adam | epoch: 003 | loss: 0.48460 - acc: 0.7780 -- iter: 20800/24500


Training Step: 1092  | total loss: 

0.48372

 | time: 80.472s


| Adam | epoch: 003 | loss: 0.48372 - acc: 0.7767 -- iter: 20864/24500


Training Step: 1093  | total loss: 

0.48179

 | time: 80.715s


| Adam | epoch: 003 | loss: 0.48179 - acc: 0.7788 -- iter: 20928/24500


Training Step: 1094  | total loss: 

0.47079

 | time: 80.957s


| Adam | epoch: 003 | loss: 0.47079 - acc: 0.7853 -- iter: 20992/24500


Training Step: 1095  | total loss: 

0.47281

 | time: 81.194s


| Adam | epoch: 003 | loss: 0.47281 - acc: 0.7849 -- iter: 21056/24500


Training Step: 1096  | total loss: 

0.47820

 | time: 81.442s


| Adam | epoch: 003 | loss: 0.47820 - acc: 0.7829 -- iter: 21120/24500


Training Step: 1097  | total loss: 

0.47089

 | time: 81.685s


| Adam | epoch: 003 | loss: 0.47089 - acc: 0.7875 -- iter: 21184/24500


Training Step: 1098  | total loss: 

0.47749

 | time: 81.932s


| Adam | epoch: 003 | loss: 0.47749 - acc: 0.7821 -- iter: 21248/24500


Training Step: 1099  | total loss: 

0.48014

 | time: 82.192s


| Adam | epoch: 003 | loss: 0.48014 - acc: 0.7805 -- iter: 21312/24500


Training Step: 1100  | total loss: 

0.48348

 | time: 82.487s


| Adam | epoch: 003 | loss: 0.48348 - acc: 0.7790 -- iter: 21376/24500


Training Step: 1101  | total loss: 

0.48344

 | time: 82.770s


| Adam | epoch: 003 | loss: 0.48344 - acc: 0.7777 -- iter: 21440/24500


Training Step: 1102  | total loss: 

0.47705

 | time: 83.070s


| Adam | epoch: 003 | loss: 0.47705 - acc: 0.7812 -- iter: 21504/24500


Training Step: 1103  | total loss: 

0.48844

 | time: 83.337s


| Adam | epoch: 003 | loss: 0.48844 - acc: 0.7749 -- iter: 21568/24500


Training Step: 1104  | total loss: 

0.50008

 | time: 83.624s


| Adam | epoch: 003 | loss: 0.50008 - acc: 0.7724 -- iter: 21632/24500


Training Step: 1105  | total loss: 

0.50353

 | time: 83.895s


| Adam | epoch: 003 | loss: 0.50353 - acc: 0.7686 -- iter: 21696/24500


Training Step: 1106  | total loss: 

0.49565

 | time: 84.175s


| Adam | epoch: 003 | loss: 0.49565 - acc: 0.7730 -- iter: 21760/24500


Training Step: 1107  | total loss: 

0.49872

 | time: 84.461s


| Adam | epoch: 003 | loss: 0.49872 - acc: 0.7723 -- iter: 21824/24500


Training Step: 1108  | total loss: 

0.50137

 | time: 84.725s


| Adam | epoch: 003 | loss: 0.50137 - acc: 0.7622 -- iter: 21888/24500


Training Step: 1109  | total loss: 

0.51170

 | time: 84.995s


| Adam | epoch: 003 | loss: 0.51170 - acc: 0.7579 -- iter: 21952/24500


Training Step: 1110  | total loss: 

0.51053

 | time: 85.275s


| Adam | epoch: 003 | loss: 0.51053 - acc: 0.7587 -- iter: 22016/24500


Training Step: 1111  | total loss: 

0.50905

 | time: 85.554s


| Adam | epoch: 003 | loss: 0.50905 - acc: 0.7609 -- iter: 22080/24500


Training Step: 1112  | total loss: 

0.51666

 | time: 85.805s


| Adam | epoch: 003 | loss: 0.51666 - acc: 0.7489 -- iter: 22144/24500


Training Step: 1113  | total loss: 

0.51236

 | time: 86.086s


| Adam | epoch: 003 | loss: 0.51236 - acc: 0.7506 -- iter: 22208/24500


Training Step: 1114  | total loss: 

0.51469

 | time: 86.361s


| Adam | epoch: 003 | loss: 0.51469 - acc: 0.7474 -- iter: 22272/24500


Training Step: 1115  | total loss: 

0.51174

 | time: 86.634s


| Adam | epoch: 003 | loss: 0.51174 - acc: 0.7492 -- iter: 22336/24500


Training Step: 1116  | total loss: 

0.51080

 | time: 86.910s


| Adam | epoch: 003 | loss: 0.51080 - acc: 0.7493 -- iter: 22400/24500


Training Step: 1117  | total loss: 

0.51387

 | time: 87.171s


| Adam | epoch: 003 | loss: 0.51387 - acc: 0.7415 -- iter: 22464/24500


Training Step: 1118  | total loss: 

0.51372

 | time: 87.448s


| Adam | epoch: 003 | loss: 0.51372 - acc: 0.7455 -- iter: 22528/24500


Training Step: 1119  | total loss: 

0.50973

 | time: 87.740s


| Adam | epoch: 003 | loss: 0.50973 - acc: 0.7491 -- iter: 22592/24500


Training Step: 1120  | total loss: 

0.54688

 | time: 88.003s


| Adam | epoch: 003 | loss: 0.54688 - acc: 0.7336 -- iter: 22656/24500


Training Step: 1121  | total loss: 

0.54672

 | time: 88.290s


| Adam | epoch: 003 | loss: 0.54672 - acc: 0.7383 -- iter: 22720/24500


Training Step: 1122  | total loss: 

0.53888

 | time: 88.566s


| Adam | epoch: 003 | loss: 0.53888 - acc: 0.7457 -- iter: 22784/24500


Training Step: 1123  | total loss: 

0.52926

 | time: 88.834s


| Adam | epoch: 003 | loss: 0.52926 - acc: 0.7493 -- iter: 22848/24500


Training Step: 1124  | total loss: 

0.52628

 | time: 89.104s


| Adam | epoch: 003 | loss: 0.52628 - acc: 0.7556 -- iter: 22912/24500


Training Step: 1125  | total loss: 

0.51593

 | time: 89.378s


| Adam | epoch: 003 | loss: 0.51593 - acc: 0.7582 -- iter: 22976/24500


Training Step: 1126  | total loss: 

0.51071

 | time: 89.650s


| Adam | epoch: 003 | loss: 0.51071 - acc: 0.7636 -- iter: 23040/24500


Training Step: 1127  | total loss: 

0.50792

 | time: 89.919s


| Adam | epoch: 003 | loss: 0.50792 - acc: 0.7654 -- iter: 23104/24500


Training Step: 1128  | total loss: 

0.50239

 | time: 90.207s


| Adam | epoch: 003 | loss: 0.50239 - acc: 0.7638 -- iter: 23168/24500


Training Step: 1129  | total loss: 

0.49974

 | time: 90.458s


| Adam | epoch: 003 | loss: 0.49974 - acc: 0.7671 -- iter: 23232/24500


Training Step: 1130  | total loss: 

0.49251

 | time: 90.711s


| Adam | epoch: 003 | loss: 0.49251 - acc: 0.7748 -- iter: 23296/24500


Training Step: 1131  | total loss: 

0.49332

 | time: 90.956s


| Adam | epoch: 003 | loss: 0.49332 - acc: 0.7692 -- iter: 23360/24500


Training Step: 1132  | total loss: 

0.48883

 | time: 91.206s


| Adam | epoch: 003 | loss: 0.48883 - acc: 0.7720 -- iter: 23424/24500


Training Step: 1133  | total loss: 

0.49652

 | time: 91.452s


| Adam | epoch: 003 | loss: 0.49652 - acc: 0.7651 -- iter: 23488/24500


Training Step: 1134  | total loss: 

0.49631

 | time: 91.695s


| Adam | epoch: 003 | loss: 0.49631 - acc: 0.7636 -- iter: 23552/24500


Training Step: 1135  | total loss: 

0.49233

 | time: 91.945s


| Adam | epoch: 003 | loss: 0.49233 - acc: 0.7607 -- iter: 23616/24500


Training Step: 1136  | total loss: 

0.48617

 | time: 92.190s


| Adam | epoch: 003 | loss: 0.48617 - acc: 0.7643 -- iter: 23680/24500


Training Step: 1137  | total loss: 

0.48002

 | time: 92.444s


| Adam | epoch: 003 | loss: 0.48002 - acc: 0.7691 -- iter: 23744/24500


Training Step: 1138  | total loss: 

0.48349

 | time: 92.698s


| Adam | epoch: 003 | loss: 0.48349 - acc: 0.7703 -- iter: 23808/24500


Training Step: 1139  | total loss: 

0.48750

 | time: 92.940s


| Adam | epoch: 003 | loss: 0.48750 - acc: 0.7683 -- iter: 23872/24500


Training Step: 1140  | total loss: 

0.49624

 | time: 93.174s


| Adam | epoch: 003 | loss: 0.49624 - acc: 0.7649 -- iter: 23936/24500


Training Step: 1141  | total loss: 

0.48948

 | time: 93.416s


| Adam | epoch: 003 | loss: 0.48948 - acc: 0.7665 -- iter: 24000/24500


Training Step: 1142  | total loss: 

0.48790

 | time: 93.656s


| Adam | epoch: 003 | loss: 0.48790 - acc: 0.7711 -- iter: 24064/24500


Training Step: 1143  | total loss: 

0.49841

 | time: 93.892s


| Adam | epoch: 003 | loss: 0.49841 - acc: 0.7643 -- iter: 24128/24500


Training Step: 1144  | total loss: 

0.49543

 | time: 94.137s


| Adam | epoch: 003 | loss: 0.49543 - acc: 0.7629 -- iter: 24192/24500


Training Step: 1145  | total loss: 

0.49775

 | time: 94.381s


| Adam | epoch: 003 | loss: 0.49775 - acc: 0.7663 -- iter: 24256/24500


Training Step: 1146  | total loss: 

0.49199

 | time: 94.624s


| Adam | epoch: 003 | loss: 0.49199 - acc: 0.7647 -- iter: 24320/24500


Training Step: 1147  | total loss: 

0.49478

 | time: 94.864s


| Adam | epoch: 003 | loss: 0.49478 - acc: 0.7601 -- iter: 24384/24500


Training Step: 1148  | total loss: 

0.48776

 | time: 95.119s


| Adam | epoch: 003 | loss: 0.48776 - acc: 0.7653 -- iter: 24448/24500


Training Step: 1149  | total loss: 

0.48789

 | time: 96.365s


| Adam | epoch: 003 | loss: 0.48789 - acc: 0.7653 | val_loss: 0.51646 - val_acc: 0.7580 -- iter: 24500/24500
--


Training Step: 1150  | total loss: 

0.49090

 | time: 0.238s


| Adam | epoch: 004 | loss: 0.49090 - acc: 0.7591 -- iter: 00064/24500


Training Step: 1151  | total loss: 

0.49576

 | time: 0.459s


| Adam | epoch: 004 | loss: 0.49576 - acc: 0.7566 -- iter: 00128/24500


Training Step: 1152  | total loss: 

0.49416

 | time: 0.676s


| Adam | epoch: 004 | loss: 0.49416 - acc: 0.7618 -- iter: 00192/24500


Training Step: 1153  | total loss: 

0.49187

 | time: 0.923s


| Adam | epoch: 004 | loss: 0.49187 - acc: 0.7644 -- iter: 00256/24500


Training Step: 1154  | total loss: 

0.49193

 | time: 1.163s


| Adam | epoch: 004 | loss: 0.49193 - acc: 0.7645 -- iter: 00320/24500


Training Step: 1155  | total loss: 

0.49027

 | time: 1.427s


| Adam | epoch: 004 | loss: 0.49027 - acc: 0.7662 -- iter: 00384/24500


Training Step: 1156  | total loss: 

0.49091

 | time: 1.699s


| Adam | epoch: 004 | loss: 0.49091 - acc: 0.7662 -- iter: 00448/24500


Training Step: 1157  | total loss: 

0.48845

 | time: 1.945s


| Adam | epoch: 004 | loss: 0.48845 - acc: 0.7645 -- iter: 00512/24500


Training Step: 1158  | total loss: 

0.49441

 | time: 2.179s


| Adam | epoch: 004 | loss: 0.49441 - acc: 0.7631 -- iter: 00576/24500


Training Step: 1159  | total loss: 

0.48989

 | time: 2.419s


| Adam | epoch: 004 | loss: 0.48989 - acc: 0.7618 -- iter: 00640/24500


Training Step: 1160  | total loss: 

0.48807

 | time: 2.663s


| Adam | epoch: 004 | loss: 0.48807 - acc: 0.7637 -- iter: 00704/24500


Training Step: 1161  | total loss: 

0.49790

 | time: 2.906s


| Adam | epoch: 004 | loss: 0.49790 - acc: 0.7592 -- iter: 00768/24500


Training Step: 1162  | total loss: 

0.50123

 | time: 3.151s


| Adam | epoch: 004 | loss: 0.50123 - acc: 0.7599 -- iter: 00832/24500


Training Step: 1163  | total loss: 

0.49445

 | time: 3.388s


| Adam | epoch: 004 | loss: 0.49445 - acc: 0.7698 -- iter: 00896/24500


Training Step: 1164  | total loss: 

0.48723

 | time: 3.628s


| Adam | epoch: 004 | loss: 0.48723 - acc: 0.7756 -- iter: 00960/24500


Training Step: 1165  | total loss: 

0.48614

 | time: 3.877s


| Adam | epoch: 004 | loss: 0.48614 - acc: 0.7731 -- iter: 01024/24500


Training Step: 1166  | total loss: 

0.49525

 | time: 4.125s


| Adam | epoch: 004 | loss: 0.49525 - acc: 0.7661 -- iter: 01088/24500


Training Step: 1167  | total loss: 

0.48526

 | time: 4.365s


| Adam | epoch: 004 | loss: 0.48526 - acc: 0.7692 -- iter: 01152/24500


Training Step: 1168  | total loss: 

0.48504

 | time: 4.613s


| Adam | epoch: 004 | loss: 0.48504 - acc: 0.7719 -- iter: 01216/24500


Training Step: 1169  | total loss: 

0.47824

 | time: 4.856s


| Adam | epoch: 004 | loss: 0.47824 - acc: 0.7791 -- iter: 01280/24500


Training Step: 1170  | total loss: 

0.47209

 | time: 5.094s


| Adam | epoch: 004 | loss: 0.47209 - acc: 0.7840 -- iter: 01344/24500


Training Step: 1171  | total loss: 

0.46935

 | time: 5.338s


| Adam | epoch: 004 | loss: 0.46935 - acc: 0.7869 -- iter: 01408/24500


Training Step: 1172  | total loss: 

0.45674

 | time: 5.588s


| Adam | epoch: 004 | loss: 0.45674 - acc: 0.7910 -- iter: 01472/24500


Training Step: 1173  | total loss: 

0.46023

 | time: 5.824s


| Adam | epoch: 004 | loss: 0.46023 - acc: 0.7869 -- iter: 01536/24500


Training Step: 1174  | total loss: 

0.45211

 | time: 6.067s


| Adam | epoch: 004 | loss: 0.45211 - acc: 0.7848 -- iter: 01600/24500


Training Step: 1175  | total loss: 

0.46085

 | time: 6.305s


| Adam | epoch: 004 | loss: 0.46085 - acc: 0.7735 -- iter: 01664/24500


Training Step: 1176  | total loss: 

0.47009

 | time: 6.552s


| Adam | epoch: 004 | loss: 0.47009 - acc: 0.7727 -- iter: 01728/24500


Training Step: 1177  | total loss: 

0.46124

 | time: 6.796s


| Adam | epoch: 004 | loss: 0.46124 - acc: 0.7814 -- iter: 01792/24500


Training Step: 1178  | total loss: 

0.46813

 | time: 7.040s


| Adam | epoch: 004 | loss: 0.46813 - acc: 0.7782 -- iter: 01856/24500


Training Step: 1179  | total loss: 

0.46318

 | time: 7.276s


| Adam | epoch: 004 | loss: 0.46318 - acc: 0.7801 -- iter: 01920/24500


Training Step: 1180  | total loss: 

0.46897

 | time: 7.523s


| Adam | epoch: 004 | loss: 0.46897 - acc: 0.7708 -- iter: 01984/24500


Training Step: 1181  | total loss: 

0.47602

 | time: 7.765s


| Adam | epoch: 004 | loss: 0.47602 - acc: 0.7656 -- iter: 02048/24500


Training Step: 1182  | total loss: 

0.46928

 | time: 8.005s


| Adam | epoch: 004 | loss: 0.46928 - acc: 0.7734 -- iter: 02112/24500


Training Step: 1183  | total loss: 

0.47333

 | time: 8.247s


| Adam | epoch: 004 | loss: 0.47333 - acc: 0.7695 -- iter: 02176/24500


Training Step: 1184  | total loss: 

0.47280

 | time: 8.487s


| Adam | epoch: 004 | loss: 0.47280 - acc: 0.7676 -- iter: 02240/24500


Training Step: 1185  | total loss: 

0.48875

 | time: 8.732s


| Adam | epoch: 004 | loss: 0.48875 - acc: 0.7611 -- iter: 02304/24500


Training Step: 1186  | total loss: 

0.49792

 | time: 8.973s


| Adam | epoch: 004 | loss: 0.49792 - acc: 0.7585 -- iter: 02368/24500


Training Step: 1187  | total loss: 

0.50891

 | time: 9.221s


| Adam | epoch: 004 | loss: 0.50891 - acc: 0.7498 -- iter: 02432/24500


Training Step: 1188  | total loss: 

0.49950

 | time: 9.464s


| Adam | epoch: 004 | loss: 0.49950 - acc: 0.7592 -- iter: 02496/24500


Training Step: 1189  | total loss: 

0.49946

 | time: 9.711s


| Adam | epoch: 004 | loss: 0.49946 - acc: 0.7645 -- iter: 02560/24500


Training Step: 1190  | total loss: 

0.49914

 | time: 9.950s


| Adam | epoch: 004 | loss: 0.49914 - acc: 0.7631 -- iter: 02624/24500


Training Step: 1191  | total loss: 

0.49510

 | time: 10.186s


| Adam | epoch: 004 | loss: 0.49510 - acc: 0.7665 -- iter: 02688/24500


Training Step: 1192  | total loss: 

0.48443

 | time: 10.424s


| Adam | epoch: 004 | loss: 0.48443 - acc: 0.7742 -- iter: 02752/24500


Training Step: 1193  | total loss: 

0.48757

 | time: 10.671s


| Adam | epoch: 004 | loss: 0.48757 - acc: 0.7702 -- iter: 02816/24500


Training Step: 1194  | total loss: 

0.48797

 | time: 10.919s


| Adam | epoch: 004 | loss: 0.48797 - acc: 0.7713 -- iter: 02880/24500


Training Step: 1195  | total loss: 

0.48732

 | time: 11.164s


| Adam | epoch: 004 | loss: 0.48732 - acc: 0.7692 -- iter: 02944/24500


Training Step: 1196  | total loss: 

0.49101

 | time: 11.409s


| Adam | epoch: 004 | loss: 0.49101 - acc: 0.7626 -- iter: 03008/24500


Training Step: 1197  | total loss: 

0.48620

 | time: 11.657s


| Adam | epoch: 004 | loss: 0.48620 - acc: 0.7676 -- iter: 03072/24500


Training Step: 1198  | total loss: 

0.48354

 | time: 11.903s


| Adam | epoch: 004 | loss: 0.48354 - acc: 0.7627 -- iter: 03136/24500


Training Step: 1199  | total loss: 

0.48599

 | time: 12.145s


| Adam | epoch: 004 | loss: 0.48599 - acc: 0.7630 -- iter: 03200/24500


Training Step: 1200  | total loss: 

0.47391

 | time: 12.387s


| Adam | epoch: 004 | loss: 0.47391 - acc: 0.7695 -- iter: 03264/24500


Training Step: 1201  | total loss: 

0.46626

 | time: 12.640s


| Adam | epoch: 004 | loss: 0.46626 - acc: 0.7738 -- iter: 03328/24500


Training Step: 1202  | total loss: 

0.46043

 | time: 12.870s


| Adam | epoch: 004 | loss: 0.46043 - acc: 0.7777 -- iter: 03392/24500


Training Step: 1203  | total loss: 

0.45390

 | time: 13.107s


| Adam | epoch: 004 | loss: 0.45390 - acc: 0.7811 -- iter: 03456/24500


Training Step: 1204  | total loss: 

0.45588

 | time: 13.350s


| Adam | epoch: 004 | loss: 0.45588 - acc: 0.7780 -- iter: 03520/24500


Training Step: 1205  | total loss: 

0.46804

 | time: 13.606s


| Adam | epoch: 004 | loss: 0.46804 - acc: 0.7690 -- iter: 03584/24500


Training Step: 1206  | total loss: 

0.46534

 | time: 13.857s


| Adam | epoch: 004 | loss: 0.46534 - acc: 0.7718 -- iter: 03648/24500


Training Step: 1207  | total loss: 

0.46422

 | time: 14.098s


| Adam | epoch: 004 | loss: 0.46422 - acc: 0.7712 -- iter: 03712/24500


Training Step: 1208  | total loss: 

0.45716

 | time: 14.342s


| Adam | epoch: 004 | loss: 0.45716 - acc: 0.7784 -- iter: 03776/24500


Training Step: 1209  | total loss: 

0.45171

 | time: 14.590s


| Adam | epoch: 004 | loss: 0.45171 - acc: 0.7834 -- iter: 03840/24500


Training Step: 1210  | total loss: 

0.47398

 | time: 14.838s


| Adam | epoch: 004 | loss: 0.47398 - acc: 0.7769 -- iter: 03904/24500


Training Step: 1211  | total loss: 

0.48724

 | time: 15.085s


| Adam | epoch: 004 | loss: 0.48724 - acc: 0.7680 -- iter: 03968/24500


Training Step: 1212  | total loss: 

0.48600

 | time: 15.322s


| Adam | epoch: 004 | loss: 0.48600 - acc: 0.7724 -- iter: 04032/24500


Training Step: 1213  | total loss: 

0.47791

 | time: 15.561s


| Adam | epoch: 004 | loss: 0.47791 - acc: 0.7733 -- iter: 04096/24500


Training Step: 1214  | total loss: 

0.47084

 | time: 15.800s


| Adam | epoch: 004 | loss: 0.47084 - acc: 0.7757 -- iter: 04160/24500


Training Step: 1215  | total loss: 

0.47128

 | time: 16.043s


| Adam | epoch: 004 | loss: 0.47128 - acc: 0.7731 -- iter: 04224/24500


Training Step: 1216  | total loss: 

0.47744

 | time: 16.281s


| Adam | epoch: 004 | loss: 0.47744 - acc: 0.7661 -- iter: 04288/24500


Training Step: 1217  | total loss: 

0.47789

 | time: 16.516s


| Adam | epoch: 004 | loss: 0.47789 - acc: 0.7661 -- iter: 04352/24500


Training Step: 1218  | total loss: 

0.47925

 | time: 16.763s


| Adam | epoch: 004 | loss: 0.47925 - acc: 0.7645 -- iter: 04416/24500


Training Step: 1219  | total loss: 

0.47557

 | time: 17.002s


| Adam | epoch: 004 | loss: 0.47557 - acc: 0.7677 -- iter: 04480/24500


Training Step: 1220  | total loss: 

0.46905

 | time: 17.241s


| Adam | epoch: 004 | loss: 0.46905 - acc: 0.7769 -- iter: 04544/24500


Training Step: 1221  | total loss: 

0.47097

 | time: 17.491s


| Adam | epoch: 004 | loss: 0.47097 - acc: 0.7757 -- iter: 04608/24500


Training Step: 1222  | total loss: 

0.47292

 | time: 17.735s


| Adam | epoch: 004 | loss: 0.47292 - acc: 0.7732 -- iter: 04672/24500


Training Step: 1223  | total loss: 

0.48376

 | time: 17.981s


| Adam | epoch: 004 | loss: 0.48376 - acc: 0.7662 -- iter: 04736/24500


Training Step: 1224  | total loss: 

0.47484

 | time: 18.231s


| Adam | epoch: 004 | loss: 0.47484 - acc: 0.7755 -- iter: 04800/24500


Training Step: 1225  | total loss: 

0.46909

 | time: 18.476s


| Adam | epoch: 004 | loss: 0.46909 - acc: 0.7807 -- iter: 04864/24500


Training Step: 1226  | total loss: 

0.47264

 | time: 18.728s


| Adam | epoch: 004 | loss: 0.47264 - acc: 0.7745 -- iter: 04928/24500


Training Step: 1227  | total loss: 

0.46686

 | time: 18.975s


| Adam | epoch: 004 | loss: 0.46686 - acc: 0.7799 -- iter: 04992/24500


Training Step: 1228  | total loss: 

0.47349

 | time: 19.211s


| Adam | epoch: 004 | loss: 0.47349 - acc: 0.7722 -- iter: 05056/24500


Training Step: 1229  | total loss: 

0.47575

 | time: 19.459s


| Adam | epoch: 004 | loss: 0.47575 - acc: 0.7716 -- iter: 05120/24500


Training Step: 1230  | total loss: 

0.49764

 | time: 19.703s


| Adam | epoch: 004 | loss: 0.49764 - acc: 0.7585 -- iter: 05184/24500


Training Step: 1231  | total loss: 

0.49136

 | time: 19.931s


| Adam | epoch: 004 | loss: 0.49136 - acc: 0.7701 -- iter: 05248/24500


Training Step: 1232  | total loss: 

0.49651

 | time: 20.181s


| Adam | epoch: 004 | loss: 0.49651 - acc: 0.7634 -- iter: 05312/24500


Training Step: 1233  | total loss: 

0.49831

 | time: 20.422s


| Adam | epoch: 004 | loss: 0.49831 - acc: 0.7590 -- iter: 05376/24500


Training Step: 1234  | total loss: 

0.48236

 | time: 20.677s


| Adam | epoch: 004 | loss: 0.48236 - acc: 0.7674 -- iter: 05440/24500


Training Step: 1235  | total loss: 

0.47176

 | time: 20.924s


| Adam | epoch: 004 | loss: 0.47176 - acc: 0.7735 -- iter: 05504/24500


Training Step: 1236  | total loss: 

0.46903

 | time: 21.163s


| Adam | epoch: 004 | loss: 0.46903 - acc: 0.7712 -- iter: 05568/24500


Training Step: 1237  | total loss: 

0.46307

 | time: 21.411s


| Adam | epoch: 004 | loss: 0.46307 - acc: 0.7737 -- iter: 05632/24500


Training Step: 1238  | total loss: 

0.46198

 | time: 21.649s


| Adam | epoch: 004 | loss: 0.46198 - acc: 0.7776 -- iter: 05696/24500


Training Step: 1239  | total loss: 

0.47081

 | time: 21.897s


| Adam | epoch: 004 | loss: 0.47081 - acc: 0.7764 -- iter: 05760/24500


Training Step: 1240  | total loss: 

0.48130

 | time: 22.142s


| Adam | epoch: 004 | loss: 0.48130 - acc: 0.7644 -- iter: 05824/24500


Training Step: 1241  | total loss: 

0.48945

 | time: 22.381s


| Adam | epoch: 004 | loss: 0.48945 - acc: 0.7598 -- iter: 05888/24500


Training Step: 1242  | total loss: 

0.48826

 | time: 22.617s


| Adam | epoch: 004 | loss: 0.48826 - acc: 0.7588 -- iter: 05952/24500


Training Step: 1243  | total loss: 

0.48618

 | time: 22.863s


| Adam | epoch: 004 | loss: 0.48618 - acc: 0.7564 -- iter: 06016/24500


Training Step: 1244  | total loss: 

0.48581

 | time: 23.112s


| Adam | epoch: 004 | loss: 0.48581 - acc: 0.7526 -- iter: 06080/24500


Training Step: 1245  | total loss: 

0.48211

 | time: 23.349s


| Adam | epoch: 004 | loss: 0.48211 - acc: 0.7555 -- iter: 06144/24500


Training Step: 1246  | total loss: 

0.46599

 | time: 23.593s


| Adam | epoch: 004 | loss: 0.46599 - acc: 0.7706 -- iter: 06208/24500


Training Step: 1247  | total loss: 

0.47043

 | time: 23.845s


| Adam | epoch: 004 | loss: 0.47043 - acc: 0.7701 -- iter: 06272/24500


Training Step: 1248  | total loss: 

0.47811

 | time: 24.087s


| Adam | epoch: 004 | loss: 0.47811 - acc: 0.7681 -- iter: 06336/24500


Training Step: 1249  | total loss: 

0.48802

 | time: 24.324s


| Adam | epoch: 004 | loss: 0.48802 - acc: 0.7631 -- iter: 06400/24500


Training Step: 1250  | total loss: 

0.48536

 | time: 24.568s


| Adam | epoch: 004 | loss: 0.48536 - acc: 0.7634 -- iter: 06464/24500


Training Step: 1251  | total loss: 

0.48485

 | time: 24.821s


| Adam | epoch: 004 | loss: 0.48485 - acc: 0.7699 -- iter: 06528/24500


Training Step: 1252  | total loss: 

0.48771

 | time: 25.070s


| Adam | epoch: 004 | loss: 0.48771 - acc: 0.7632 -- iter: 06592/24500


Training Step: 1253  | total loss: 

0.49018

 | time: 25.320s


| Adam | epoch: 004 | loss: 0.49018 - acc: 0.7603 -- iter: 06656/24500


Training Step: 1254  | total loss: 

0.48516

 | time: 25.563s


| Adam | epoch: 004 | loss: 0.48516 - acc: 0.7624 -- iter: 06720/24500


Training Step: 1255  | total loss: 

0.48343

 | time: 25.806s


| Adam | epoch: 004 | loss: 0.48343 - acc: 0.7643 -- iter: 06784/24500


Training Step: 1256  | total loss: 

0.47965

 | time: 26.040s


| Adam | epoch: 004 | loss: 0.47965 - acc: 0.7675 -- iter: 06848/24500


Training Step: 1257  | total loss: 

0.48674

 | time: 26.280s


| Adam | epoch: 004 | loss: 0.48674 - acc: 0.7595 -- iter: 06912/24500


Training Step: 1258  | total loss: 

0.48086

 | time: 26.518s


| Adam | epoch: 004 | loss: 0.48086 - acc: 0.7648 -- iter: 06976/24500


Training Step: 1259  | total loss: 

0.47909

 | time: 26.758s


| Adam | epoch: 004 | loss: 0.47909 - acc: 0.7602 -- iter: 07040/24500


Training Step: 1260  | total loss: 

0.48489

 | time: 26.998s


| Adam | epoch: 004 | loss: 0.48489 - acc: 0.7576 -- iter: 07104/24500


Training Step: 1261  | total loss: 

0.48643

 | time: 27.249s


| Adam | epoch: 004 | loss: 0.48643 - acc: 0.7569 -- iter: 07168/24500


Training Step: 1262  | total loss: 

0.48204

 | time: 27.491s


| Adam | epoch: 004 | loss: 0.48204 - acc: 0.7593 -- iter: 07232/24500


Training Step: 1263  | total loss: 

0.46909

 | time: 27.725s


| Adam | epoch: 004 | loss: 0.46909 - acc: 0.7740 -- iter: 07296/24500


Training Step: 1264  | total loss: 

0.47004

 | time: 27.960s


| Adam | epoch: 004 | loss: 0.47004 - acc: 0.7794 -- iter: 07360/24500


Training Step: 1265  | total loss: 

0.47487

 | time: 28.199s


| Adam | epoch: 004 | loss: 0.47487 - acc: 0.7749 -- iter: 07424/24500


Training Step: 1266  | total loss: 

0.47653

 | time: 28.441s


| Adam | epoch: 004 | loss: 0.47653 - acc: 0.7709 -- iter: 07488/24500


Training Step: 1267  | total loss: 

0.47334

 | time: 28.682s


| Adam | epoch: 004 | loss: 0.47334 - acc: 0.7750 -- iter: 07552/24500


Training Step: 1268  | total loss: 

0.46638

 | time: 28.913s


| Adam | epoch: 004 | loss: 0.46638 - acc: 0.7803 -- iter: 07616/24500


Training Step: 1269  | total loss: 

0.48039

 | time: 29.163s


| Adam | epoch: 004 | loss: 0.48039 - acc: 0.7695 -- iter: 07680/24500


Training Step: 1270  | total loss: 

0.48699

 | time: 29.410s


| Adam | epoch: 004 | loss: 0.48699 - acc: 0.7550 -- iter: 07744/24500


Training Step: 1271  | total loss: 

0.48638

 | time: 29.655s


| Adam | epoch: 004 | loss: 0.48638 - acc: 0.7577 -- iter: 07808/24500


Training Step: 1272  | total loss: 

0.48485

 | time: 29.901s


| Adam | epoch: 004 | loss: 0.48485 - acc: 0.7585 -- iter: 07872/24500


Training Step: 1273  | total loss: 

0.48034

 | time: 30.145s


| Adam | epoch: 004 | loss: 0.48034 - acc: 0.7560 -- iter: 07936/24500


Training Step: 1274  | total loss: 

0.48168

 | time: 30.378s


| Adam | epoch: 004 | loss: 0.48168 - acc: 0.7570 -- iter: 08000/24500


Training Step: 1275  | total loss: 

0.49016

 | time: 30.620s


| Adam | epoch: 004 | loss: 0.49016 - acc: 0.7532 -- iter: 08064/24500


Training Step: 1276  | total loss: 

0.50123

 | time: 30.865s


| Adam | epoch: 004 | loss: 0.50123 - acc: 0.7466 -- iter: 08128/24500


Training Step: 1277  | total loss: 

0.49446

 | time: 31.109s


| Adam | epoch: 004 | loss: 0.49446 - acc: 0.7454 -- iter: 08192/24500


Training Step: 1278  | total loss: 

0.48899

 | time: 31.346s


| Adam | epoch: 004 | loss: 0.48899 - acc: 0.7490 -- iter: 08256/24500


Training Step: 1279  | total loss: 

0.48917

 | time: 31.603s


| Adam | epoch: 004 | loss: 0.48917 - acc: 0.7460 -- iter: 08320/24500


Training Step: 1280  | total loss: 

0.48044

 | time: 31.877s


| Adam | epoch: 004 | loss: 0.48044 - acc: 0.7589 -- iter: 08384/24500


Training Step: 1281  | total loss: 

0.47599

 | time: 32.161s


| Adam | epoch: 004 | loss: 0.47599 - acc: 0.7689 -- iter: 08448/24500


Training Step: 1282  | total loss: 

0.47640

 | time: 32.422s


| Adam | epoch: 004 | loss: 0.47640 - acc: 0.7686 -- iter: 08512/24500


Training Step: 1283  | total loss: 

0.48193

 | time: 32.694s


| Adam | epoch: 004 | loss: 0.48193 - acc: 0.7605 -- iter: 08576/24500


Training Step: 1284  | total loss: 

0.47356

 | time: 32.982s


| Adam | epoch: 004 | loss: 0.47356 - acc: 0.7672 -- iter: 08640/24500


Training Step: 1285  | total loss: 

0.47313

 | time: 33.257s


| Adam | epoch: 004 | loss: 0.47313 - acc: 0.7671 -- iter: 08704/24500


Training Step: 1286  | total loss: 

0.47238

 | time: 33.500s


| Adam | epoch: 004 | loss: 0.47238 - acc: 0.7716 -- iter: 08768/24500


Training Step: 1287  | total loss: 

0.46954

 | time: 33.756s


| Adam | epoch: 004 | loss: 0.46954 - acc: 0.7710 -- iter: 08832/24500


Training Step: 1288  | total loss: 

0.47635

 | time: 34.001s


| Adam | epoch: 004 | loss: 0.47635 - acc: 0.7689 -- iter: 08896/24500


Training Step: 1289  | total loss: 

0.47486

 | time: 34.240s


| Adam | epoch: 004 | loss: 0.47486 - acc: 0.7717 -- iter: 08960/24500


Training Step: 1290  | total loss: 

0.47608

 | time: 34.475s


| Adam | epoch: 004 | loss: 0.47608 - acc: 0.7695 -- iter: 09024/24500


Training Step: 1291  | total loss: 

0.48085

 | time: 34.716s


| Adam | epoch: 004 | loss: 0.48085 - acc: 0.7692 -- iter: 09088/24500


Training Step: 1292  | total loss: 

0.48296

 | time: 34.968s


| Adam | epoch: 004 | loss: 0.48296 - acc: 0.7657 -- iter: 09152/24500


Training Step: 1293  | total loss: 

0.48846

 | time: 35.213s


| Adam | epoch: 004 | loss: 0.48846 - acc: 0.7610 -- iter: 09216/24500


Training Step: 1294  | total loss: 

0.48584

 | time: 35.459s


| Adam | epoch: 004 | loss: 0.48584 - acc: 0.7630 -- iter: 09280/24500


Training Step: 1295  | total loss: 

0.47473

 | time: 35.689s


| Adam | epoch: 004 | loss: 0.47473 - acc: 0.7711 -- iter: 09344/24500


Training Step: 1296  | total loss: 

0.47502

 | time: 35.930s


| Adam | epoch: 004 | loss: 0.47502 - acc: 0.7737 -- iter: 09408/24500


Training Step: 1297  | total loss: 

0.48316

 | time: 36.177s


| Adam | epoch: 004 | loss: 0.48316 - acc: 0.7697 -- iter: 09472/24500


Training Step: 1298  | total loss: 

0.48795

 | time: 36.422s


| Adam | epoch: 004 | loss: 0.48795 - acc: 0.7662 -- iter: 09536/24500


Training Step: 1299  | total loss: 

0.49059

 | time: 36.663s


| Adam | epoch: 004 | loss: 0.49059 - acc: 0.7646 -- iter: 09600/24500


Training Step: 1300  | total loss: 

0.48790

 | time: 36.908s


| Adam | epoch: 004 | loss: 0.48790 - acc: 0.7662 -- iter: 09664/24500


Training Step: 1301  | total loss: 

0.48791

 | time: 37.157s


| Adam | epoch: 004 | loss: 0.48791 - acc: 0.7693 -- iter: 09728/24500


Training Step: 1302  | total loss: 

0.48478

 | time: 37.404s


| Adam | epoch: 004 | loss: 0.48478 - acc: 0.7783 -- iter: 09792/24500


Training Step: 1303  | total loss: 

0.49202

 | time: 37.642s


| Adam | epoch: 004 | loss: 0.49202 - acc: 0.7739 -- iter: 09856/24500


Training Step: 1304  | total loss: 

0.49568

 | time: 37.881s


| Adam | epoch: 004 | loss: 0.49568 - acc: 0.7700 -- iter: 09920/24500


Training Step: 1305  | total loss: 

0.48827

 | time: 38.123s


| Adam | epoch: 004 | loss: 0.48827 - acc: 0.7742 -- iter: 09984/24500


Training Step: 1306  | total loss: 

0.50262

 | time: 38.371s


| Adam | epoch: 004 | loss: 0.50262 - acc: 0.7702 -- iter: 10048/24500


Training Step: 1307  | total loss: 

0.50219

 | time: 38.607s


| Adam | epoch: 004 | loss: 0.50219 - acc: 0.7698 -- iter: 10112/24500


Training Step: 1308  | total loss: 

0.50222

 | time: 38.847s


| Adam | epoch: 004 | loss: 0.50222 - acc: 0.7678 -- iter: 10176/24500


Training Step: 1309  | total loss: 

0.50084

 | time: 39.092s


| Adam | epoch: 004 | loss: 0.50084 - acc: 0.7691 -- iter: 10240/24500


Training Step: 1310  | total loss: 

0.52172

 | time: 39.337s


| Adam | epoch: 004 | loss: 0.52172 - acc: 0.7579 -- iter: 10304/24500


Training Step: 1311  | total loss: 

0.52061

 | time: 39.577s


| Adam | epoch: 004 | loss: 0.52061 - acc: 0.7555 -- iter: 10368/24500


Training Step: 1312  | total loss: 

0.52162

 | time: 39.827s


| Adam | epoch: 004 | loss: 0.52162 - acc: 0.7518 -- iter: 10432/24500


Training Step: 1313  | total loss: 

0.52279

 | time: 40.080s


| Adam | epoch: 004 | loss: 0.52279 - acc: 0.7501 -- iter: 10496/24500


Training Step: 1314  | total loss: 

0.51712

 | time: 40.327s


| Adam | epoch: 004 | loss: 0.51712 - acc: 0.7579 -- iter: 10560/24500


Training Step: 1315  | total loss: 

0.50026

 | time: 40.563s


| Adam | epoch: 004 | loss: 0.50026 - acc: 0.7665 -- iter: 10624/24500


Training Step: 1316  | total loss: 

0.50698

 | time: 40.800s


| Adam | epoch: 004 | loss: 0.50698 - acc: 0.7570 -- iter: 10688/24500


Training Step: 1317  | total loss: 

0.50632

 | time: 41.051s


| Adam | epoch: 004 | loss: 0.50632 - acc: 0.7548 -- iter: 10752/24500


Training Step: 1318  | total loss: 

0.50195

 | time: 41.300s


| Adam | epoch: 004 | loss: 0.50195 - acc: 0.7590 -- iter: 10816/24500


Training Step: 1319  | total loss: 

0.49700

 | time: 41.551s


| Adam | epoch: 004 | loss: 0.49700 - acc: 0.7549 -- iter: 10880/24500


Training Step: 1320  | total loss: 

0.49630

 | time: 41.791s


| Adam | epoch: 004 | loss: 0.49630 - acc: 0.7560 -- iter: 10944/24500


Training Step: 1321  | total loss: 

0.49281

 | time: 42.040s


| Adam | epoch: 004 | loss: 0.49281 - acc: 0.7585 -- iter: 11008/24500


Training Step: 1322  | total loss: 

0.49995

 | time: 42.278s


| Adam | epoch: 004 | loss: 0.49995 - acc: 0.7499 -- iter: 11072/24500


Training Step: 1323  | total loss: 

0.49895

 | time: 42.515s


| Adam | epoch: 004 | loss: 0.49895 - acc: 0.7499 -- iter: 11136/24500


Training Step: 1324  | total loss: 

0.50119

 | time: 42.765s


| Adam | epoch: 004 | loss: 0.50119 - acc: 0.7499 -- iter: 11200/24500


Training Step: 1325  | total loss: 

0.50158

 | time: 43.009s


| Adam | epoch: 004 | loss: 0.50158 - acc: 0.7546 -- iter: 11264/24500


Training Step: 1326  | total loss: 

0.48646

 | time: 43.252s


| Adam | epoch: 004 | loss: 0.48646 - acc: 0.7666 -- iter: 11328/24500


Training Step: 1327  | total loss: 

0.48236

 | time: 43.497s


| Adam | epoch: 004 | loss: 0.48236 - acc: 0.7712 -- iter: 11392/24500


Training Step: 1328  | total loss: 

0.47970

 | time: 43.742s


| Adam | epoch: 004 | loss: 0.47970 - acc: 0.7722 -- iter: 11456/24500


Training Step: 1329  | total loss: 

0.48023

 | time: 43.983s


| Adam | epoch: 004 | loss: 0.48023 - acc: 0.7684 -- iter: 11520/24500


Training Step: 1330  | total loss: 

0.48518

 | time: 44.227s


| Adam | epoch: 004 | loss: 0.48518 - acc: 0.7682 -- iter: 11584/24500


Training Step: 1331  | total loss: 

0.47778

 | time: 44.490s


| Adam | epoch: 004 | loss: 0.47778 - acc: 0.7710 -- iter: 11648/24500


Training Step: 1332  | total loss: 

0.47688

 | time: 44.775s


| Adam | epoch: 004 | loss: 0.47688 - acc: 0.7736 -- iter: 11712/24500


Training Step: 1333  | total loss: 

0.47518

 | time: 45.012s


| Adam | epoch: 004 | loss: 0.47518 - acc: 0.7713 -- iter: 11776/24500


Training Step: 1334  | total loss: 

0.49121

 | time: 45.259s


| Adam | epoch: 004 | loss: 0.49121 - acc: 0.7644 -- iter: 11840/24500


Training Step: 1335  | total loss: 

0.48720

 | time: 45.495s


| Adam | epoch: 004 | loss: 0.48720 - acc: 0.7661 -- iter: 11904/24500


Training Step: 1336  | total loss: 

0.47772

 | time: 45.739s


| Adam | epoch: 004 | loss: 0.47772 - acc: 0.7723 -- iter: 11968/24500


Training Step: 1337  | total loss: 

0.47699

 | time: 45.980s


| Adam | epoch: 004 | loss: 0.47699 - acc: 0.7701 -- iter: 12032/24500


Training Step: 1338  | total loss: 

0.48222

 | time: 46.228s


| Adam | epoch: 004 | loss: 0.48222 - acc: 0.7728 -- iter: 12096/24500


Training Step: 1339  | total loss: 

0.48424

 | time: 46.475s


| Adam | epoch: 004 | loss: 0.48424 - acc: 0.7674 -- iter: 12160/24500


Training Step: 1340  | total loss: 

0.49467

 | time: 46.717s


| Adam | epoch: 004 | loss: 0.49467 - acc: 0.7563 -- iter: 12224/24500


Training Step: 1341  | total loss: 

0.49335

 | time: 46.957s


| Adam | epoch: 004 | loss: 0.49335 - acc: 0.7572 -- iter: 12288/24500


Training Step: 1342  | total loss: 

0.48694

 | time: 47.210s


| Adam | epoch: 004 | loss: 0.48694 - acc: 0.7612 -- iter: 12352/24500


Training Step: 1343  | total loss: 

0.48602

 | time: 47.454s


| Adam | epoch: 004 | loss: 0.48602 - acc: 0.7600 -- iter: 12416/24500


Training Step: 1344  | total loss: 

0.48814

 | time: 47.697s


| Adam | epoch: 004 | loss: 0.48814 - acc: 0.7622 -- iter: 12480/24500


Training Step: 1345  | total loss: 

0.50133

 | time: 47.942s


| Adam | epoch: 004 | loss: 0.50133 - acc: 0.7500 -- iter: 12544/24500


Training Step: 1346  | total loss: 

0.49874

 | time: 48.187s


| Adam | epoch: 004 | loss: 0.49874 - acc: 0.7516 -- iter: 12608/24500


Training Step: 1347  | total loss: 

0.50182

 | time: 48.432s


| Adam | epoch: 004 | loss: 0.50182 - acc: 0.7514 -- iter: 12672/24500


Training Step: 1348  | total loss: 

0.49640

 | time: 48.670s


| Adam | epoch: 004 | loss: 0.49640 - acc: 0.7591 -- iter: 12736/24500


Training Step: 1349  | total loss: 

0.49427

 | time: 48.912s


| Adam | epoch: 004 | loss: 0.49427 - acc: 0.7676 -- iter: 12800/24500


Training Step: 1350  | total loss: 

0.50172

 | time: 49.152s


| Adam | epoch: 004 | loss: 0.50172 - acc: 0.7580 -- iter: 12864/24500


Training Step: 1351  | total loss: 

0.50777

 | time: 49.400s


| Adam | epoch: 004 | loss: 0.50777 - acc: 0.7556 -- iter: 12928/24500


Training Step: 1352  | total loss: 

0.49876

 | time: 49.640s


| Adam | epoch: 004 | loss: 0.49876 - acc: 0.7566 -- iter: 12992/24500


Training Step: 1353  | total loss: 

0.49808

 | time: 49.885s


| Adam | epoch: 004 | loss: 0.49808 - acc: 0.7591 -- iter: 13056/24500


Training Step: 1354  | total loss: 

0.49050

 | time: 50.132s


| Adam | epoch: 004 | loss: 0.49050 - acc: 0.7597 -- iter: 13120/24500


Training Step: 1355  | total loss: 

0.48298

 | time: 50.377s


| Adam | epoch: 004 | loss: 0.48298 - acc: 0.7666 -- iter: 13184/24500


Training Step: 1356  | total loss: 

0.48566

 | time: 50.607s


| Adam | epoch: 004 | loss: 0.48566 - acc: 0.7696 -- iter: 13248/24500


Training Step: 1357  | total loss: 

0.49645

 | time: 50.859s


| Adam | epoch: 004 | loss: 0.49645 - acc: 0.7598 -- iter: 13312/24500


Training Step: 1358  | total loss: 

0.49084

 | time: 51.106s


| Adam | epoch: 004 | loss: 0.49084 - acc: 0.7682 -- iter: 13376/24500


Training Step: 1359  | total loss: 

0.49354

 | time: 51.350s


| Adam | epoch: 004 | loss: 0.49354 - acc: 0.7633 -- iter: 13440/24500


Training Step: 1360  | total loss: 

0.49431

 | time: 51.592s


| Adam | epoch: 004 | loss: 0.49431 - acc: 0.7620 -- iter: 13504/24500


Training Step: 1361  | total loss: 

0.49356

 | time: 51.837s


| Adam | epoch: 004 | loss: 0.49356 - acc: 0.7639 -- iter: 13568/24500


Training Step: 1362  | total loss: 

0.48498

 | time: 52.081s


| Adam | epoch: 004 | loss: 0.48498 - acc: 0.7703 -- iter: 13632/24500


Training Step: 1363  | total loss: 

0.47687

 | time: 52.329s


| Adam | epoch: 004 | loss: 0.47687 - acc: 0.7698 -- iter: 13696/24500


Training Step: 1364  | total loss: 

0.47583

 | time: 52.578s


| Adam | epoch: 004 | loss: 0.47583 - acc: 0.7632 -- iter: 13760/24500


Training Step: 1365  | total loss: 

0.47100

 | time: 52.824s


| Adam | epoch: 004 | loss: 0.47100 - acc: 0.7697 -- iter: 13824/24500


Training Step: 1366  | total loss: 

0.48589

 | time: 53.071s


| Adam | epoch: 004 | loss: 0.48589 - acc: 0.7630 -- iter: 13888/24500


Training Step: 1367  | total loss: 

0.48576

 | time: 53.311s


| Adam | epoch: 004 | loss: 0.48576 - acc: 0.7664 -- iter: 13952/24500


Training Step: 1368  | total loss: 

0.48636

 | time: 53.575s


| Adam | epoch: 004 | loss: 0.48636 - acc: 0.7679 -- iter: 14016/24500


Training Step: 1369  | total loss: 

0.49359

 | time: 53.828s


| Adam | epoch: 004 | loss: 0.49359 - acc: 0.7567 -- iter: 14080/24500


Training Step: 1370  | total loss: 

0.48915

 | time: 54.058s


| Adam | epoch: 004 | loss: 0.48915 - acc: 0.7607 -- iter: 14144/24500


Training Step: 1371  | total loss: 

0.49139

 | time: 54.309s


| Adam | epoch: 004 | loss: 0.49139 - acc: 0.7628 -- iter: 14208/24500


Training Step: 1372  | total loss: 

0.48239

 | time: 54.553s


| Adam | epoch: 004 | loss: 0.48239 - acc: 0.7756 -- iter: 14272/24500


Training Step: 1373  | total loss: 

0.48031

 | time: 54.789s


| Adam | epoch: 004 | loss: 0.48031 - acc: 0.7714 -- iter: 14336/24500


Training Step: 1374  | total loss: 

0.48262

 | time: 55.037s


| Adam | epoch: 004 | loss: 0.48262 - acc: 0.7693 -- iter: 14400/24500


Training Step: 1375  | total loss: 

0.48636

 | time: 55.277s


| Adam | epoch: 004 | loss: 0.48636 - acc: 0.7674 -- iter: 14464/24500


Training Step: 1376  | total loss: 

0.48747

 | time: 55.517s


| Adam | epoch: 004 | loss: 0.48747 - acc: 0.7625 -- iter: 14528/24500


Training Step: 1377  | total loss: 

0.48795

 | time: 55.752s


| Adam | epoch: 004 | loss: 0.48795 - acc: 0.7581 -- iter: 14592/24500


Training Step: 1378  | total loss: 

0.49080

 | time: 55.998s


| Adam | epoch: 004 | loss: 0.49080 - acc: 0.7526 -- iter: 14656/24500


Training Step: 1379  | total loss: 

0.49187

 | time: 56.235s


| Adam | epoch: 004 | loss: 0.49187 - acc: 0.7524 -- iter: 14720/24500


Training Step: 1380  | total loss: 

0.48746

 | time: 56.462s


| Adam | epoch: 004 | loss: 0.48746 - acc: 0.7521 -- iter: 14784/24500


Training Step: 1381  | total loss: 

0.48904

 | time: 56.711s


| Adam | epoch: 004 | loss: 0.48904 - acc: 0.7519 -- iter: 14848/24500


Training Step: 1382  | total loss: 

0.49006

 | time: 56.951s


| Adam | epoch: 004 | loss: 0.49006 - acc: 0.7517 -- iter: 14912/24500


Training Step: 1383  | total loss: 

0.50238

 | time: 57.193s


| Adam | epoch: 004 | loss: 0.50238 - acc: 0.7453 -- iter: 14976/24500


Training Step: 1384  | total loss: 

0.49860

 | time: 57.445s


| Adam | epoch: 004 | loss: 0.49860 - acc: 0.7458 -- iter: 15040/24500


Training Step: 1385  | total loss: 

0.49409

 | time: 57.693s


| Adam | epoch: 004 | loss: 0.49409 - acc: 0.7524 -- iter: 15104/24500


Training Step: 1386  | total loss: 

0.49100

 | time: 57.947s


| Adam | epoch: 004 | loss: 0.49100 - acc: 0.7569 -- iter: 15168/24500


Training Step: 1387  | total loss: 

0.49681

 | time: 58.288s


| Adam | epoch: 004 | loss: 0.49681 - acc: 0.7531 -- iter: 15232/24500


Training Step: 1388  | total loss: 

0.49199

 | time: 58.543s


| Adam | epoch: 004 | loss: 0.49199 - acc: 0.7590 -- iter: 15296/24500


Training Step: 1389  | total loss: 

0.49751

 | time: 58.804s


| Adam | epoch: 004 | loss: 0.49751 - acc: 0.7550 -- iter: 15360/24500


Training Step: 1390  | total loss: 

0.50753

 | time: 59.050s


| Adam | epoch: 004 | loss: 0.50753 - acc: 0.7482 -- iter: 15424/24500


Training Step: 1391  | total loss: 

0.50132

 | time: 59.306s


| Adam | epoch: 004 | loss: 0.50132 - acc: 0.7547 -- iter: 15488/24500


Training Step: 1392  | total loss: 

0.50270

 | time: 59.541s


| Adam | epoch: 004 | loss: 0.50270 - acc: 0.7511 -- iter: 15552/24500


Training Step: 1393  | total loss: 

0.51305

 | time: 59.781s


| Adam | epoch: 004 | loss: 0.51305 - acc: 0.7447 -- iter: 15616/24500


Training Step: 1394  | total loss: 

0.51226

 | time: 60.036s


| Adam | epoch: 004 | loss: 0.51226 - acc: 0.7421 -- iter: 15680/24500


Training Step: 1395  | total loss: 

0.51284

 | time: 60.297s


| Adam | epoch: 004 | loss: 0.51284 - acc: 0.7429 -- iter: 15744/24500


Training Step: 1396  | total loss: 

0.50294

 | time: 60.552s


| Adam | epoch: 004 | loss: 0.50294 - acc: 0.7577 -- iter: 15808/24500


Training Step: 1397  | total loss: 

0.50193

 | time: 60.806s


| Adam | epoch: 004 | loss: 0.50193 - acc: 0.7585 -- iter: 15872/24500


Training Step: 1398  | total loss: 

0.49677

 | time: 61.057s


| Adam | epoch: 004 | loss: 0.49677 - acc: 0.7639 -- iter: 15936/24500


Training Step: 1399  | total loss: 

0.49468

 | time: 61.304s


| Adam | epoch: 004 | loss: 0.49468 - acc: 0.7687 -- iter: 16000/24500


Training Step: 1400  | total loss: 

0.49265

 | time: 61.549s


| Adam | epoch: 004 | loss: 0.49265 - acc: 0.7669 -- iter: 16064/24500


Training Step: 1401  | total loss: 

0.49080

 | time: 61.792s


| Adam | epoch: 004 | loss: 0.49080 - acc: 0.7699 -- iter: 16128/24500


Training Step: 1402  | total loss: 

0.49010

 | time: 62.035s


| Adam | epoch: 004 | loss: 0.49010 - acc: 0.7710 -- iter: 16192/24500


Training Step: 1403  | total loss: 

0.49516

 | time: 62.275s


| Adam | epoch: 004 | loss: 0.49516 - acc: 0.7705 -- iter: 16256/24500


Training Step: 1404  | total loss: 

0.47933

 | time: 62.513s


| Adam | epoch: 004 | loss: 0.47933 - acc: 0.7778 -- iter: 16320/24500


Training Step: 1405  | total loss: 

0.47378

 | time: 62.754s


| Adam | epoch: 004 | loss: 0.47378 - acc: 0.7860 -- iter: 16384/24500


Training Step: 1406  | total loss: 

0.47092

 | time: 62.994s


| Adam | epoch: 004 | loss: 0.47092 - acc: 0.7808 -- iter: 16448/24500


Training Step: 1407  | total loss: 

0.48608

 | time: 63.225s


| Adam | epoch: 004 | loss: 0.48608 - acc: 0.7793 -- iter: 16512/24500


Training Step: 1408  | total loss: 

0.48941

 | time: 63.481s


| Adam | epoch: 004 | loss: 0.48941 - acc: 0.7795 -- iter: 16576/24500


Training Step: 1409  | total loss: 

0.48479

 | time: 63.735s


| Adam | epoch: 004 | loss: 0.48479 - acc: 0.7797 -- iter: 16640/24500


Training Step: 1410  | total loss: 

0.47155

 | time: 63.978s


| Adam | epoch: 004 | loss: 0.47155 - acc: 0.7876 -- iter: 16704/24500


Training Step: 1411  | total loss: 

0.46805

 | time: 64.215s


| Adam | epoch: 004 | loss: 0.46805 - acc: 0.7901 -- iter: 16768/24500


Training Step: 1412  | total loss: 

0.47738

 | time: 64.460s


| Adam | epoch: 004 | loss: 0.47738 - acc: 0.7861 -- iter: 16832/24500


Training Step: 1413  | total loss: 

0.47295

 | time: 64.707s


| Adam | epoch: 004 | loss: 0.47295 - acc: 0.7872 -- iter: 16896/24500


Training Step: 1414  | total loss: 

0.47450

 | time: 64.946s


| Adam | epoch: 004 | loss: 0.47450 - acc: 0.7850 -- iter: 16960/24500


Training Step: 1415  | total loss: 

0.47152

 | time: 65.193s


| Adam | epoch: 004 | loss: 0.47152 - acc: 0.7800 -- iter: 17024/24500


Training Step: 1416  | total loss: 

0.47615

 | time: 65.435s


| Adam | epoch: 004 | loss: 0.47615 - acc: 0.7832 -- iter: 17088/24500


Training Step: 1417  | total loss: 

0.48198

 | time: 65.682s


| Adam | epoch: 004 | loss: 0.48198 - acc: 0.7815 -- iter: 17152/24500


Training Step: 1418  | total loss: 

0.48899

 | time: 65.929s


| Adam | epoch: 004 | loss: 0.48899 - acc: 0.7752 -- iter: 17216/24500


Training Step: 1419  | total loss: 

0.47588

 | time: 66.170s


| Adam | epoch: 004 | loss: 0.47588 - acc: 0.7836 -- iter: 17280/24500


Training Step: 1420  | total loss: 

0.47032

 | time: 66.413s


| Adam | epoch: 004 | loss: 0.47032 - acc: 0.7834 -- iter: 17344/24500


Training Step: 1421  | total loss: 

0.47731

 | time: 66.655s


| Adam | epoch: 004 | loss: 0.47731 - acc: 0.7785 -- iter: 17408/24500


Training Step: 1422  | total loss: 

0.46956

 | time: 66.899s


| Adam | epoch: 004 | loss: 0.46956 - acc: 0.7834 -- iter: 17472/24500


Training Step: 1423  | total loss: 

0.46999

 | time: 67.197s


| Adam | epoch: 004 | loss: 0.46999 - acc: 0.7817 -- iter: 17536/24500


Training Step: 1424  | total loss: 

0.46854

 | time: 67.447s


| Adam | epoch: 004 | loss: 0.46854 - acc: 0.7801 -- iter: 17600/24500


Training Step: 1425  | total loss: 

0.46230

 | time: 67.688s


| Adam | epoch: 004 | loss: 0.46230 - acc: 0.7817 -- iter: 17664/24500


Training Step: 1426  | total loss: 

0.46392

 | time: 67.935s


| Adam | epoch: 004 | loss: 0.46392 - acc: 0.7801 -- iter: 17728/24500


Training Step: 1427  | total loss: 

0.44631

 | time: 68.175s


| Adam | epoch: 004 | loss: 0.44631 - acc: 0.7896 -- iter: 17792/24500


Training Step: 1428  | total loss: 

0.45291

 | time: 68.422s


| Adam | epoch: 004 | loss: 0.45291 - acc: 0.7810 -- iter: 17856/24500


Training Step: 1429  | total loss: 

0.45162

 | time: 68.667s


| Adam | epoch: 004 | loss: 0.45162 - acc: 0.7794 -- iter: 17920/24500


Training Step: 1430  | total loss: 

0.45012

 | time: 68.918s


| Adam | epoch: 004 | loss: 0.45012 - acc: 0.7827 -- iter: 17984/24500


Training Step: 1431  | total loss: 

0.44342

 | time: 69.160s


| Adam | epoch: 004 | loss: 0.44342 - acc: 0.7841 -- iter: 18048/24500


Training Step: 1432  | total loss: 

0.43805

 | time: 69.407s


| Adam | epoch: 004 | loss: 0.43805 - acc: 0.7885 -- iter: 18112/24500


Training Step: 1433  | total loss: 

0.44202

 | time: 69.640s


| Adam | epoch: 004 | loss: 0.44202 - acc: 0.7909 -- iter: 18176/24500


Training Step: 1434  | total loss: 

0.44475

 | time: 69.881s


| Adam | epoch: 004 | loss: 0.44475 - acc: 0.7931 -- iter: 18240/24500


Training Step: 1435  | total loss: 

0.46614

 | time: 70.119s


| Adam | epoch: 004 | loss: 0.46614 - acc: 0.7841 -- iter: 18304/24500


Training Step: 1436  | total loss: 

0.46893

 | time: 70.366s


| Adam | epoch: 004 | loss: 0.46893 - acc: 0.7791 -- iter: 18368/24500


Training Step: 1437  | total loss: 

0.48066

 | time: 70.598s


| Adam | epoch: 004 | loss: 0.48066 - acc: 0.7668 -- iter: 18432/24500


Training Step: 1438  | total loss: 

0.47353

 | time: 70.842s


| Adam | epoch: 004 | loss: 0.47353 - acc: 0.7745 -- iter: 18496/24500


Training Step: 1439  | total loss: 

0.46610

 | time: 71.091s


| Adam | epoch: 004 | loss: 0.46610 - acc: 0.7768 -- iter: 18560/24500


Training Step: 1440  | total loss: 

0.46725

 | time: 71.338s


| Adam | epoch: 004 | loss: 0.46725 - acc: 0.7788 -- iter: 18624/24500


Training Step: 1441  | total loss: 

0.47486

 | time: 71.601s


| Adam | epoch: 004 | loss: 0.47486 - acc: 0.7681 -- iter: 18688/24500


Training Step: 1442  | total loss: 

0.47313

 | time: 71.854s


| Adam | epoch: 004 | loss: 0.47313 - acc: 0.7725 -- iter: 18752/24500


Training Step: 1443  | total loss: 

0.46582

 | time: 72.101s


| Adam | epoch: 004 | loss: 0.46582 - acc: 0.7750 -- iter: 18816/24500


Training Step: 1444  | total loss: 

0.47323

 | time: 72.360s


| Adam | epoch: 004 | loss: 0.47323 - acc: 0.7662 -- iter: 18880/24500


Training Step: 1445  | total loss: 

0.46630

 | time: 72.617s


| Adam | epoch: 004 | loss: 0.46630 - acc: 0.7693 -- iter: 18944/24500


Training Step: 1446  | total loss: 

0.46963

 | time: 72.878s


| Adam | epoch: 004 | loss: 0.46963 - acc: 0.7689 -- iter: 19008/24500


Training Step: 1447  | total loss: 

0.46783

 | time: 73.123s


| Adam | epoch: 004 | loss: 0.46783 - acc: 0.7717 -- iter: 19072/24500


Training Step: 1448  | total loss: 

0.47020

 | time: 73.353s


| Adam | epoch: 004 | loss: 0.47020 - acc: 0.7742 -- iter: 19136/24500


Training Step: 1449  | total loss: 

0.46426

 | time: 73.599s


| Adam | epoch: 004 | loss: 0.46426 - acc: 0.7796 -- iter: 19200/24500


Training Step: 1450  | total loss: 

0.46570

 | time: 73.844s


| Adam | epoch: 004 | loss: 0.46570 - acc: 0.7767 -- iter: 19264/24500


Training Step: 1451  | total loss: 

0.47440

 | time: 74.096s


| Adam | epoch: 004 | loss: 0.47440 - acc: 0.7740 -- iter: 19328/24500


Training Step: 1452  | total loss: 

0.47948

 | time: 74.345s


| Adam | epoch: 004 | loss: 0.47948 - acc: 0.7685 -- iter: 19392/24500


Training Step: 1453  | total loss: 

0.47340

 | time: 74.594s


| Adam | epoch: 004 | loss: 0.47340 - acc: 0.7697 -- iter: 19456/24500


Training Step: 1454  | total loss: 

0.46616

 | time: 74.837s


| Adam | epoch: 004 | loss: 0.46616 - acc: 0.7803 -- iter: 19520/24500


Training Step: 1455  | total loss: 

0.46152

 | time: 75.070s


| Adam | epoch: 004 | loss: 0.46152 - acc: 0.7866 -- iter: 19584/24500


Training Step: 1456  | total loss: 

0.45974

 | time: 75.319s


| Adam | epoch: 004 | loss: 0.45974 - acc: 0.7908 -- iter: 19648/24500


Training Step: 1457  | total loss: 

0.48381

 | time: 75.563s


| Adam | epoch: 004 | loss: 0.48381 - acc: 0.7804 -- iter: 19712/24500


Training Step: 1458  | total loss: 

0.47709

 | time: 75.797s


| Adam | epoch: 004 | loss: 0.47709 - acc: 0.7852 -- iter: 19776/24500


Training Step: 1459  | total loss: 

0.47552

 | time: 76.038s


| Adam | epoch: 004 | loss: 0.47552 - acc: 0.7879 -- iter: 19840/24500


Training Step: 1460  | total loss: 

0.48131

 | time: 76.287s


| Adam | epoch: 004 | loss: 0.48131 - acc: 0.7873 -- iter: 19904/24500


Training Step: 1461  | total loss: 

0.47944

 | time: 76.535s


| Adam | epoch: 004 | loss: 0.47944 - acc: 0.7851 -- iter: 19968/24500


Training Step: 1462  | total loss: 

0.47867

 | time: 76.784s


| Adam | epoch: 004 | loss: 0.47867 - acc: 0.7847 -- iter: 20032/24500


Training Step: 1463  | total loss: 

0.47467

 | time: 77.029s


| Adam | epoch: 004 | loss: 0.47467 - acc: 0.7875 -- iter: 20096/24500


Training Step: 1464  | total loss: 

0.47507

 | time: 77.269s


| Adam | epoch: 004 | loss: 0.47507 - acc: 0.7806 -- iter: 20160/24500


Training Step: 1465  | total loss: 

0.48283

 | time: 77.512s


| Adam | epoch: 004 | loss: 0.48283 - acc: 0.7729 -- iter: 20224/24500


Training Step: 1466  | total loss: 

0.48864

 | time: 77.757s


| Adam | epoch: 004 | loss: 0.48864 - acc: 0.7706 -- iter: 20288/24500


Training Step: 1467  | total loss: 

0.49075

 | time: 78.012s


| Adam | epoch: 004 | loss: 0.49075 - acc: 0.7685 -- iter: 20352/24500


Training Step: 1468  | total loss: 

0.49815

 | time: 78.257s


| Adam | epoch: 004 | loss: 0.49815 - acc: 0.7573 -- iter: 20416/24500


Training Step: 1469  | total loss: 

0.50205

 | time: 78.503s


| Adam | epoch: 004 | loss: 0.50205 - acc: 0.7550 -- iter: 20480/24500


Training Step: 1470  | total loss: 

0.49511

 | time: 78.746s


| Adam | epoch: 004 | loss: 0.49511 - acc: 0.7592 -- iter: 20544/24500


Training Step: 1471  | total loss: 

0.49258

 | time: 78.992s


| Adam | epoch: 004 | loss: 0.49258 - acc: 0.7614 -- iter: 20608/24500


Training Step: 1472  | total loss: 

0.49756

 | time: 79.231s


| Adam | epoch: 004 | loss: 0.49756 - acc: 0.7540 -- iter: 20672/24500


Training Step: 1473  | total loss: 

0.48380

 | time: 79.473s


| Adam | epoch: 004 | loss: 0.48380 - acc: 0.7630 -- iter: 20736/24500


Training Step: 1474  | total loss: 

0.47743

 | time: 79.723s


| Adam | epoch: 004 | loss: 0.47743 - acc: 0.7711 -- iter: 20800/24500


Training Step: 1475  | total loss: 

0.47298

 | time: 79.959s


| Adam | epoch: 004 | loss: 0.47298 - acc: 0.7752 -- iter: 20864/24500


Training Step: 1476  | total loss: 

0.46971

 | time: 80.204s


| Adam | epoch: 004 | loss: 0.46971 - acc: 0.7821 -- iter: 20928/24500


Training Step: 1477  | total loss: 

0.47313

 | time: 80.457s


| Adam | epoch: 004 | loss: 0.47313 - acc: 0.7773 -- iter: 20992/24500


Training Step: 1478  | total loss: 

0.47866

 | time: 80.698s


| Adam | epoch: 004 | loss: 0.47866 - acc: 0.7699 -- iter: 21056/24500


Training Step: 1479  | total loss: 

0.49014

 | time: 80.944s


| Adam | epoch: 004 | loss: 0.49014 - acc: 0.7616 -- iter: 21120/24500


Training Step: 1480  | total loss: 

0.48337

 | time: 81.195s


| Adam | epoch: 004 | loss: 0.48337 - acc: 0.7667 -- iter: 21184/24500


Training Step: 1481  | total loss: 

0.48946

 | time: 81.432s


| Adam | epoch: 004 | loss: 0.48946 - acc: 0.7635 -- iter: 21248/24500


Training Step: 1482  | total loss: 

0.49106

 | time: 81.677s


| Adam | epoch: 004 | loss: 0.49106 - acc: 0.7637 -- iter: 21312/24500


Training Step: 1483  | total loss: 

0.48549

 | time: 81.921s


| Adam | epoch: 004 | loss: 0.48549 - acc: 0.7686 -- iter: 21376/24500


Training Step: 1484  | total loss: 

0.47988

 | time: 82.156s


| Adam | epoch: 004 | loss: 0.47988 - acc: 0.7714 -- iter: 21440/24500


Training Step: 1485  | total loss: 

0.47526

 | time: 82.402s


| Adam | epoch: 004 | loss: 0.47526 - acc: 0.7740 -- iter: 21504/24500


Training Step: 1486  | total loss: 

0.47984

 | time: 82.642s


| Adam | epoch: 004 | loss: 0.47984 - acc: 0.7731 -- iter: 21568/24500


Training Step: 1487  | total loss: 

0.47542

 | time: 82.890s


| Adam | epoch: 004 | loss: 0.47542 - acc: 0.7786 -- iter: 21632/24500


Training Step: 1488  | total loss: 

0.47836

 | time: 83.135s


| Adam | epoch: 004 | loss: 0.47836 - acc: 0.7789 -- iter: 21696/24500


Training Step: 1489  | total loss: 

0.46501

 | time: 83.376s


| Adam | epoch: 004 | loss: 0.46501 - acc: 0.7869 -- iter: 21760/24500


Training Step: 1490  | total loss: 

0.47630

 | time: 83.623s


| Adam | epoch: 004 | loss: 0.47630 - acc: 0.7848 -- iter: 21824/24500


Training Step: 1491  | total loss: 

0.47786

 | time: 83.870s


| Adam | epoch: 004 | loss: 0.47786 - acc: 0.7766 -- iter: 21888/24500


Training Step: 1492  | total loss: 

0.46977

 | time: 84.110s


| Adam | epoch: 004 | loss: 0.46977 - acc: 0.7802 -- iter: 21952/24500


Training Step: 1493  | total loss: 

0.47218

 | time: 84.359s


| Adam | epoch: 004 | loss: 0.47218 - acc: 0.7756 -- iter: 22016/24500


Training Step: 1494  | total loss: 

0.47680

 | time: 84.611s


| Adam | epoch: 004 | loss: 0.47680 - acc: 0.7731 -- iter: 22080/24500


Training Step: 1495  | total loss: 

0.46751

 | time: 84.864s


| Adam | epoch: 004 | loss: 0.46751 - acc: 0.7801 -- iter: 22144/24500


Training Step: 1496  | total loss: 

0.46675

 | time: 85.103s


| Adam | epoch: 004 | loss: 0.46675 - acc: 0.7818 -- iter: 22208/24500


Training Step: 1497  | total loss: 

0.46439

 | time: 85.351s


| Adam | epoch: 004 | loss: 0.46439 - acc: 0.7802 -- iter: 22272/24500


Training Step: 1498  | total loss: 

0.46651

 | time: 85.612s


| Adam | epoch: 004 | loss: 0.46651 - acc: 0.7819 -- iter: 22336/24500


Training Step: 1499  | total loss: 

0.46145

 | time: 85.859s


| Adam | epoch: 004 | loss: 0.46145 - acc: 0.7834 -- iter: 22400/24500


Training Step: 1500  | total loss: 

0.45879

 | time: 87.114s


| Adam | epoch: 004 | loss: 0.45879 - acc: 0.7863 | val_loss: 0.49321 - val_acc: 0.7660 -- iter: 22464/24500
--


Training Step: 1501  | total loss: 

0.45876

 | time: 87.351s


| Adam | epoch: 004 | loss: 0.45876 - acc: 0.7889 -- iter: 22528/24500


Training Step: 1502  | total loss: 

0.46922

 | time: 87.593s


| Adam | epoch: 004 | loss: 0.46922 - acc: 0.7803 -- iter: 22592/24500


Training Step: 1503  | total loss: 

0.46812

 | time: 87.843s


| Adam | epoch: 004 | loss: 0.46812 - acc: 0.7804 -- iter: 22656/24500


Training Step: 1504  | total loss: 

0.51579

 | time: 88.086s


| Adam | epoch: 004 | loss: 0.51579 - acc: 0.7617 -- iter: 22720/24500


Training Step: 1505  | total loss: 

0.51121

 | time: 88.338s


| Adam | epoch: 004 | loss: 0.51121 - acc: 0.7637 -- iter: 22784/24500


Training Step: 1506  | total loss: 

0.50535

 | time: 88.591s


| Adam | epoch: 004 | loss: 0.50535 - acc: 0.7670 -- iter: 22848/24500


Training Step: 1507  | total loss: 

0.50916

 | time: 88.850s


| Adam | epoch: 004 | loss: 0.50916 - acc: 0.7653 -- iter: 22912/24500


Training Step: 1508  | total loss: 

0.50071

 | time: 89.099s


| Adam | epoch: 004 | loss: 0.50071 - acc: 0.7732 -- iter: 22976/24500


Training Step: 1509  | total loss: 

0.48324

 | time: 89.340s


| Adam | epoch: 004 | loss: 0.48324 - acc: 0.7865 -- iter: 23040/24500


Training Step: 1510  | total loss: 

0.47908

 | time: 89.586s


| Adam | epoch: 004 | loss: 0.47908 - acc: 0.7891 -- iter: 23104/24500


Training Step: 1511  | total loss: 

0.47171

 | time: 89.823s


| Adam | epoch: 004 | loss: 0.47171 - acc: 0.7899 -- iter: 23168/24500


Training Step: 1512  | total loss: 

0.45888

 | time: 90.068s


| Adam | epoch: 004 | loss: 0.45888 - acc: 0.7999 -- iter: 23232/24500


Training Step: 1513  | total loss: 

0.46019

 | time: 90.308s


| Adam | epoch: 004 | loss: 0.46019 - acc: 0.7949 -- iter: 23296/24500


Training Step: 1514  | total loss: 

0.45032

 | time: 90.543s


| Adam | epoch: 004 | loss: 0.45032 - acc: 0.8029 -- iter: 23360/24500


Training Step: 1515  | total loss: 

0.44605

 | time: 90.792s


| Adam | epoch: 004 | loss: 0.44605 - acc: 0.8023 -- iter: 23424/24500


Training Step: 1516  | total loss: 

0.43448

 | time: 91.041s


| Adam | epoch: 004 | loss: 0.43448 - acc: 0.8112 -- iter: 23488/24500


Training Step: 1517  | total loss: 

0.43517

 | time: 91.284s


| Adam | epoch: 004 | loss: 0.43517 - acc: 0.8050 -- iter: 23552/24500


Training Step: 1518  | total loss: 

0.44128

 | time: 91.523s


| Adam | epoch: 004 | loss: 0.44128 - acc: 0.8027 -- iter: 23616/24500


Training Step: 1519  | total loss: 

0.45122

 | time: 91.776s


| Adam | epoch: 004 | loss: 0.45122 - acc: 0.7943 -- iter: 23680/24500


Training Step: 1520  | total loss: 

0.45398

 | time: 92.022s


| Adam | epoch: 004 | loss: 0.45398 - acc: 0.7992 -- iter: 23744/24500


Training Step: 1521  | total loss: 

0.45795

 | time: 92.265s


| Adam | epoch: 004 | loss: 0.45795 - acc: 0.8006 -- iter: 23808/24500


Training Step: 1522  | total loss: 

0.45270

 | time: 92.521s


| Adam | epoch: 004 | loss: 0.45270 - acc: 0.8033 -- iter: 23872/24500


Training Step: 1523  | total loss: 

0.46290

 | time: 92.764s


| Adam | epoch: 004 | loss: 0.46290 - acc: 0.7933 -- iter: 23936/24500


Training Step: 1524  | total loss: 

0.45835

 | time: 93.004s


| Adam | epoch: 004 | loss: 0.45835 - acc: 0.7983 -- iter: 24000/24500


Training Step: 1525  | total loss: 

0.46167

 | time: 93.245s


| Adam | epoch: 004 | loss: 0.46167 - acc: 0.7966 -- iter: 24064/24500


Training Step: 1526  | total loss: 

0.46790

 | time: 93.486s


| Adam | epoch: 004 | loss: 0.46790 - acc: 0.7888 -- iter: 24128/24500


Training Step: 1527  | total loss: 

0.46858

 | time: 93.731s


| Adam | epoch: 004 | loss: 0.46858 - acc: 0.7896 -- iter: 24192/24500


Training Step: 1528  | total loss: 

0.46553

 | time: 93.977s


| Adam | epoch: 004 | loss: 0.46553 - acc: 0.7872 -- iter: 24256/24500


Training Step: 1529  | total loss: 

0.45416

 | time: 94.219s


| Adam | epoch: 004 | loss: 0.45416 - acc: 0.7960 -- iter: 24320/24500


Training Step: 1530  | total loss: 

0.46244

 | time: 94.461s


| Adam | epoch: 004 | loss: 0.46244 - acc: 0.7883 -- iter: 24384/24500


Training Step: 1531  | total loss: 

0.45738

 | time: 94.700s


| Adam | epoch: 004 | loss: 0.45738 - acc: 0.7923 -- iter: 24448/24500


Training Step: 1532  | total loss: 

0.46051

 | time: 95.940s


| Adam | epoch: 004 | loss: 0.46051 - acc: 0.7943 | val_loss: 0.49823 - val_acc: 0.7720 -- iter: 24500/24500
--


Training Step: 1533  | total loss: 

0.46858

 | time: 0.245s


| Adam | epoch: 005 | loss: 0.46858 - acc: 0.7852 -- iter: 00064/24500


Training Step: 1534  | total loss: 

0.47435

 | time: 0.483s


| Adam | epoch: 005 | loss: 0.47435 - acc: 0.7832 -- iter: 00128/24500


Training Step: 1535  | total loss: 

0.47168

 | time: 0.688s


| Adam | epoch: 005 | loss: 0.47168 - acc: 0.7877 -- iter: 00192/24500


Training Step: 1536  | total loss: 

0.46192

 | time: 0.884s


| Adam | epoch: 005 | loss: 0.46192 - acc: 0.7955 -- iter: 00256/24500


Training Step: 1537  | total loss: 

0.45183

 | time: 1.124s


| Adam | epoch: 005 | loss: 0.45183 - acc: 0.8025 -- iter: 00320/24500


Training Step: 1538  | total loss: 

0.45301

 | time: 1.364s


| Adam | epoch: 005 | loss: 0.45301 - acc: 0.8003 -- iter: 00384/24500


Training Step: 1539  | total loss: 

0.45502

 | time: 1.608s


| Adam | epoch: 005 | loss: 0.45502 - acc: 0.7984 -- iter: 00448/24500


Training Step: 1540  | total loss: 

0.45657

 | time: 1.847s


| Adam | epoch: 005 | loss: 0.45657 - acc: 0.7998 -- iter: 00512/24500


Training Step: 1541  | total loss: 

0.46529

 | time: 2.094s


| Adam | epoch: 005 | loss: 0.46529 - acc: 0.7886 -- iter: 00576/24500


Training Step: 1542  | total loss: 

0.46252

 | time: 2.337s


| Adam | epoch: 005 | loss: 0.46252 - acc: 0.7879 -- iter: 00640/24500


Training Step: 1543  | total loss: 

0.47887

 | time: 2.581s


| Adam | epoch: 005 | loss: 0.47887 - acc: 0.7778 -- iter: 00704/24500


Training Step: 1544  | total loss: 

0.47922

 | time: 2.818s


| Adam | epoch: 005 | loss: 0.47922 - acc: 0.7797 -- iter: 00768/24500


Training Step: 1545  | total loss: 

0.48138

 | time: 3.062s


| Adam | epoch: 005 | loss: 0.48138 - acc: 0.7768 -- iter: 00832/24500


Training Step: 1546  | total loss: 

0.46754

 | time: 3.302s


| Adam | epoch: 005 | loss: 0.46754 - acc: 0.7866 -- iter: 00896/24500


Training Step: 1547  | total loss: 

0.47105

 | time: 3.546s


| Adam | epoch: 005 | loss: 0.47105 - acc: 0.7829 -- iter: 00960/24500


Training Step: 1548  | total loss: 

0.46883

 | time: 3.783s


| Adam | epoch: 005 | loss: 0.46883 - acc: 0.7843 -- iter: 01024/24500


Training Step: 1549  | total loss: 

0.45948

 | time: 4.026s


| Adam | epoch: 005 | loss: 0.45948 - acc: 0.7871 -- iter: 01088/24500


Training Step: 1550  | total loss: 

0.45798

 | time: 4.278s


| Adam | epoch: 005 | loss: 0.45798 - acc: 0.7928 -- iter: 01152/24500


Training Step: 1551  | total loss: 

0.44819

 | time: 4.535s


| Adam | epoch: 005 | loss: 0.44819 - acc: 0.7995 -- iter: 01216/24500


Training Step: 1552  | total loss: 

0.43505

 | time: 4.778s


| Adam | epoch: 005 | loss: 0.43505 - acc: 0.8117 -- iter: 01280/24500


Training Step: 1553  | total loss: 

0.42937

 | time: 5.018s


| Adam | epoch: 005 | loss: 0.42937 - acc: 0.8102 -- iter: 01344/24500


Training Step: 1554  | total loss: 

0.42511

 | time: 5.266s


| Adam | epoch: 005 | loss: 0.42511 - acc: 0.8089 -- iter: 01408/24500


Training Step: 1555  | total loss: 

0.42451

 | time: 5.507s


| Adam | epoch: 005 | loss: 0.42451 - acc: 0.8092 -- iter: 01472/24500


Training Step: 1556  | total loss: 

0.43029

 | time: 5.744s


| Adam | epoch: 005 | loss: 0.43029 - acc: 0.8049 -- iter: 01536/24500


Training Step: 1557  | total loss: 

0.44327

 | time: 5.983s


| Adam | epoch: 005 | loss: 0.44327 - acc: 0.7994 -- iter: 01600/24500


Training Step: 1558  | total loss: 

0.45593

 | time: 6.234s


| Adam | epoch: 005 | loss: 0.45593 - acc: 0.7866 -- iter: 01664/24500


Training Step: 1559  | total loss: 

0.44468

 | time: 6.484s


| Adam | epoch: 005 | loss: 0.44468 - acc: 0.7908 -- iter: 01728/24500


Training Step: 1560  | total loss: 

0.44483

 | time: 6.729s


| Adam | epoch: 005 | loss: 0.44483 - acc: 0.7914 -- iter: 01792/24500


Training Step: 1561  | total loss: 

0.44254

 | time: 6.974s


| Adam | epoch: 005 | loss: 0.44254 - acc: 0.7919 -- iter: 01856/24500


Training Step: 1562  | total loss: 

0.44098

 | time: 7.217s


| Adam | epoch: 005 | loss: 0.44098 - acc: 0.7956 -- iter: 01920/24500


Training Step: 1563  | total loss: 

0.45252

 | time: 7.460s


| Adam | epoch: 005 | loss: 0.45252 - acc: 0.7879 -- iter: 01984/24500


Training Step: 1564  | total loss: 

0.45342

 | time: 7.704s


| Adam | epoch: 005 | loss: 0.45342 - acc: 0.7872 -- iter: 02048/24500


Training Step: 1565  | total loss: 

0.45489

 | time: 7.942s


| Adam | epoch: 005 | loss: 0.45489 - acc: 0.7819 -- iter: 02112/24500


Training Step: 1566  | total loss: 

0.43951

 | time: 8.186s


| Adam | epoch: 005 | loss: 0.43951 - acc: 0.7912 -- iter: 02176/24500


Training Step: 1567  | total loss: 

0.43078

 | time: 8.420s


| Adam | epoch: 005 | loss: 0.43078 - acc: 0.7965 -- iter: 02240/24500


Training Step: 1568  | total loss: 

0.43358

 | time: 8.671s


| Adam | epoch: 005 | loss: 0.43358 - acc: 0.7918 -- iter: 02304/24500


Training Step: 1569  | total loss: 

0.44777

 | time: 8.911s


| Adam | epoch: 005 | loss: 0.44777 - acc: 0.7845 -- iter: 02368/24500


Training Step: 1570  | total loss: 

0.44774

 | time: 9.156s


| Adam | epoch: 005 | loss: 0.44774 - acc: 0.7873 -- iter: 02432/24500


Training Step: 1571  | total loss: 

0.44907

 | time: 9.407s


| Adam | epoch: 005 | loss: 0.44907 - acc: 0.7914 -- iter: 02496/24500


Training Step: 1572  | total loss: 

0.44714

 | time: 9.643s


| Adam | epoch: 005 | loss: 0.44714 - acc: 0.7904 -- iter: 02560/24500


Training Step: 1573  | total loss: 

0.44891

 | time: 9.882s


| Adam | epoch: 005 | loss: 0.44891 - acc: 0.7848 -- iter: 02624/24500


Training Step: 1574  | total loss: 

0.44635

 | time: 10.123s


| Adam | epoch: 005 | loss: 0.44635 - acc: 0.7829 -- iter: 02688/24500


Training Step: 1575  | total loss: 

0.45548

 | time: 10.365s


| Adam | epoch: 005 | loss: 0.45548 - acc: 0.7749 -- iter: 02752/24500


Training Step: 1576  | total loss: 

0.45525

 | time: 10.605s


| Adam | epoch: 005 | loss: 0.45525 - acc: 0.7724 -- iter: 02816/24500


Training Step: 1577  | total loss: 

0.46068

 | time: 10.848s


| Adam | epoch: 005 | loss: 0.46068 - acc: 0.7702 -- iter: 02880/24500


Training Step: 1578  | total loss: 

0.45664

 | time: 11.090s


| Adam | epoch: 005 | loss: 0.45664 - acc: 0.7744 -- iter: 02944/24500


Training Step: 1579  | total loss: 

0.44908

 | time: 11.337s


| Adam | epoch: 005 | loss: 0.44908 - acc: 0.7766 -- iter: 03008/24500


Training Step: 1580  | total loss: 

0.46208

 | time: 11.581s


| Adam | epoch: 005 | loss: 0.46208 - acc: 0.7709 -- iter: 03072/24500


Training Step: 1581  | total loss: 

0.46410

 | time: 11.821s


| Adam | epoch: 005 | loss: 0.46410 - acc: 0.7703 -- iter: 03136/24500


Training Step: 1582  | total loss: 

0.45900

 | time: 12.068s


| Adam | epoch: 005 | loss: 0.45900 - acc: 0.7730 -- iter: 03200/24500


Training Step: 1583  | total loss: 

0.46017

 | time: 12.318s


| Adam | epoch: 005 | loss: 0.46017 - acc: 0.7723 -- iter: 03264/24500


Training Step: 1584  | total loss: 

0.46714

 | time: 12.562s


| Adam | epoch: 005 | loss: 0.46714 - acc: 0.7653 -- iter: 03328/24500


Training Step: 1585  | total loss: 

0.46618

 | time: 12.801s


| Adam | epoch: 005 | loss: 0.46618 - acc: 0.7669 -- iter: 03392/24500


Training Step: 1586  | total loss: 

0.46298

 | time: 13.038s


| Adam | epoch: 005 | loss: 0.46298 - acc: 0.7699 -- iter: 03456/24500


Training Step: 1587  | total loss: 

0.46961

 | time: 13.274s


| Adam | epoch: 005 | loss: 0.46961 - acc: 0.7648 -- iter: 03520/24500


Training Step: 1588  | total loss: 

0.47584

 | time: 13.509s


| Adam | epoch: 005 | loss: 0.47584 - acc: 0.7618 -- iter: 03584/24500


Training Step: 1589  | total loss: 

0.48244

 | time: 13.748s


| Adam | epoch: 005 | loss: 0.48244 - acc: 0.7559 -- iter: 03648/24500


Training Step: 1590  | total loss: 

0.47206

 | time: 13.981s


| Adam | epoch: 005 | loss: 0.47206 - acc: 0.7694 -- iter: 03712/24500


Training Step: 1591  | total loss: 

0.45723

 | time: 14.228s


| Adam | epoch: 005 | loss: 0.45723 - acc: 0.7815 -- iter: 03776/24500


Training Step: 1592  | total loss: 

0.46179

 | time: 14.481s


| Adam | epoch: 005 | loss: 0.46179 - acc: 0.7783 -- iter: 03840/24500


Training Step: 1593  | total loss: 

0.45107

 | time: 14.727s


| Adam | epoch: 005 | loss: 0.45107 - acc: 0.7927 -- iter: 03904/24500


Training Step: 1594  | total loss: 

0.44720

 | time: 14.968s


| Adam | epoch: 005 | loss: 0.44720 - acc: 0.8009 -- iter: 03968/24500


Training Step: 1595  | total loss: 

0.44906

 | time: 15.265s


| Adam | epoch: 005 | loss: 0.44906 - acc: 0.8021 -- iter: 04032/24500


Training Step: 1596  | total loss: 

0.45264

 | time: 15.512s


| Adam | epoch: 005 | loss: 0.45264 - acc: 0.7969 -- iter: 04096/24500


Training Step: 1597  | total loss: 

0.45031

 | time: 15.750s


| Adam | epoch: 005 | loss: 0.45031 - acc: 0.7984 -- iter: 04160/24500


Training Step: 1598  | total loss: 

0.44187

 | time: 15.994s


| Adam | epoch: 005 | loss: 0.44187 - acc: 0.8030 -- iter: 04224/24500


Training Step: 1599  | total loss: 

0.45011

 | time: 16.244s


| Adam | epoch: 005 | loss: 0.45011 - acc: 0.8024 -- iter: 04288/24500


Training Step: 1600  | total loss: 

0.44307

 | time: 16.494s


| Adam | epoch: 005 | loss: 0.44307 - acc: 0.8065 -- iter: 04352/24500


Training Step: 1601  | total loss: 

0.44481

 | time: 16.754s


| Adam | epoch: 005 | loss: 0.44481 - acc: 0.8024 -- iter: 04416/24500


Training Step: 1602  | total loss: 

0.43993

 | time: 16.994s


| Adam | epoch: 005 | loss: 0.43993 - acc: 0.8034 -- iter: 04480/24500


Training Step: 1603  | total loss: 

0.43619

 | time: 17.240s


| Adam | epoch: 005 | loss: 0.43619 - acc: 0.8059 -- iter: 04544/24500


Training Step: 1604  | total loss: 

0.42616

 | time: 17.490s


| Adam | epoch: 005 | loss: 0.42616 - acc: 0.8066 -- iter: 04608/24500


Training Step: 1605  | total loss: 

0.43472

 | time: 17.718s


| Adam | epoch: 005 | loss: 0.43472 - acc: 0.7946 -- iter: 04672/24500


Training Step: 1606  | total loss: 

0.43242

 | time: 17.977s


| Adam | epoch: 005 | loss: 0.43242 - acc: 0.7933 -- iter: 04736/24500


Training Step: 1607  | total loss: 

0.44597

 | time: 18.210s


| Adam | epoch: 005 | loss: 0.44597 - acc: 0.7859 -- iter: 04800/24500


Training Step: 1608  | total loss: 

0.45141

 | time: 18.462s


| Adam | epoch: 005 | loss: 0.45141 - acc: 0.7854 -- iter: 04864/24500


Training Step: 1609  | total loss: 

0.45919

 | time: 18.700s


| Adam | epoch: 005 | loss: 0.45919 - acc: 0.7756 -- iter: 04928/24500


Training Step: 1610  | total loss: 

0.45146

 | time: 18.942s


| Adam | epoch: 005 | loss: 0.45146 - acc: 0.7809 -- iter: 04992/24500


Training Step: 1611  | total loss: 

0.45134

 | time: 19.183s


| Adam | epoch: 005 | loss: 0.45134 - acc: 0.7793 -- iter: 05056/24500


Training Step: 1612  | total loss: 

0.45243

 | time: 19.436s


| Adam | epoch: 005 | loss: 0.45243 - acc: 0.7811 -- iter: 05120/24500


Training Step: 1613  | total loss: 

0.44416

 | time: 19.683s


| Adam | epoch: 005 | loss: 0.44416 - acc: 0.7874 -- iter: 05184/24500


Training Step: 1614  | total loss: 

0.43155

 | time: 19.931s


| Adam | epoch: 005 | loss: 0.43155 - acc: 0.7961 -- iter: 05248/24500


Training Step: 1615  | total loss: 

0.43137

 | time: 20.183s


| Adam | epoch: 005 | loss: 0.43137 - acc: 0.7946 -- iter: 05312/24500


Training Step: 1616  | total loss: 

0.43231

 | time: 20.436s


| Adam | epoch: 005 | loss: 0.43231 - acc: 0.7933 -- iter: 05376/24500


Training Step: 1617  | total loss: 

0.44343

 | time: 20.680s


| Adam | epoch: 005 | loss: 0.44343 - acc: 0.7874 -- iter: 05440/24500


Training Step: 1618  | total loss: 

0.44350

 | time: 20.922s


| Adam | epoch: 005 | loss: 0.44350 - acc: 0.7930 -- iter: 05504/24500


Training Step: 1619  | total loss: 

0.44077

 | time: 21.168s


| Adam | epoch: 005 | loss: 0.44077 - acc: 0.7981 -- iter: 05568/24500


Training Step: 1620  | total loss: 

0.43439

 | time: 21.411s


| Adam | epoch: 005 | loss: 0.43439 - acc: 0.8042 -- iter: 05632/24500


Training Step: 1621  | total loss: 

0.43959

 | time: 21.661s


| Adam | epoch: 005 | loss: 0.43959 - acc: 0.8051 -- iter: 05696/24500


Training Step: 1622  | total loss: 

0.43172

 | time: 21.899s


| Adam | epoch: 005 | loss: 0.43172 - acc: 0.8074 -- iter: 05760/24500


Training Step: 1623  | total loss: 

0.43950

 | time: 22.147s


| Adam | epoch: 005 | loss: 0.43950 - acc: 0.7969 -- iter: 05824/24500


Training Step: 1624  | total loss: 

0.45147

 | time: 22.401s


| Adam | epoch: 005 | loss: 0.45147 - acc: 0.7876 -- iter: 05888/24500


Training Step: 1625  | total loss: 

0.44522

 | time: 22.638s


| Adam | epoch: 005 | loss: 0.44522 - acc: 0.7901 -- iter: 05952/24500


Training Step: 1626  | total loss: 

0.43600

 | time: 22.885s


| Adam | epoch: 005 | loss: 0.43600 - acc: 0.8017 -- iter: 06016/24500


Training Step: 1627  | total loss: 

0.43993

 | time: 23.128s


| Adam | epoch: 005 | loss: 0.43993 - acc: 0.8012 -- iter: 06080/24500


Training Step: 1628  | total loss: 

0.44341

 | time: 23.383s


| Adam | epoch: 005 | loss: 0.44341 - acc: 0.7961 -- iter: 06144/24500


Training Step: 1629  | total loss: 

0.44100

 | time: 23.619s


| Adam | epoch: 005 | loss: 0.44100 - acc: 0.7962 -- iter: 06208/24500


Training Step: 1630  | total loss: 

0.44159

 | time: 23.869s


| Adam | epoch: 005 | loss: 0.44159 - acc: 0.7947 -- iter: 06272/24500


Training Step: 1631  | total loss: 

0.44525

 | time: 24.113s


| Adam | epoch: 005 | loss: 0.44525 - acc: 0.7949 -- iter: 06336/24500


Training Step: 1632  | total loss: 

0.44051

 | time: 24.364s


| Adam | epoch: 005 | loss: 0.44051 - acc: 0.7982 -- iter: 06400/24500


Training Step: 1633  | total loss: 

0.44290

 | time: 24.616s


| Adam | epoch: 005 | loss: 0.44290 - acc: 0.7965 -- iter: 06464/24500


Training Step: 1634  | total loss: 

0.42571

 | time: 24.868s


| Adam | epoch: 005 | loss: 0.42571 - acc: 0.8059 -- iter: 06528/24500


Training Step: 1635  | total loss: 

0.41963

 | time: 25.126s


| Adam | epoch: 005 | loss: 0.41963 - acc: 0.8128 -- iter: 06592/24500


Training Step: 1636  | total loss: 

0.42566

 | time: 25.377s


| Adam | epoch: 005 | loss: 0.42566 - acc: 0.8019 -- iter: 06656/24500


Training Step: 1637  | total loss: 

0.44163

 | time: 25.639s


| Adam | epoch: 005 | loss: 0.44163 - acc: 0.7873 -- iter: 06720/24500


Training Step: 1638  | total loss: 

0.43496

 | time: 25.890s


| Adam | epoch: 005 | loss: 0.43496 - acc: 0.7914 -- iter: 06784/24500


Training Step: 1639  | total loss: 

0.43572

 | time: 26.141s


| Adam | epoch: 005 | loss: 0.43572 - acc: 0.7919 -- iter: 06848/24500


Training Step: 1640  | total loss: 

0.43764

 | time: 26.387s


| Adam | epoch: 005 | loss: 0.43764 - acc: 0.7987 -- iter: 06912/24500


Training Step: 1641  | total loss: 

0.43874

 | time: 26.651s


| Adam | epoch: 005 | loss: 0.43874 - acc: 0.7985 -- iter: 06976/24500


Training Step: 1642  | total loss: 

0.44685

 | time: 26.903s


| Adam | epoch: 005 | loss: 0.44685 - acc: 0.7921 -- iter: 07040/24500


Training Step: 1643  | total loss: 

0.44098

 | time: 27.144s


| Adam | epoch: 005 | loss: 0.44098 - acc: 0.8004 -- iter: 07104/24500


Training Step: 1644  | total loss: 

0.43973

 | time: 27.403s


| Adam | epoch: 005 | loss: 0.43973 - acc: 0.7953 -- iter: 07168/24500


Training Step: 1645  | total loss: 

0.44620

 | time: 27.659s


| Adam | epoch: 005 | loss: 0.44620 - acc: 0.7955 -- iter: 07232/24500


Training Step: 1646  | total loss: 

0.43916

 | time: 27.911s


| Adam | epoch: 005 | loss: 0.43916 - acc: 0.8034 -- iter: 07296/24500


Training Step: 1647  | total loss: 

0.44539

 | time: 28.165s


| Adam | epoch: 005 | loss: 0.44539 - acc: 0.8043 -- iter: 07360/24500


Training Step: 1648  | total loss: 

0.44890

 | time: 28.413s


| Adam | epoch: 005 | loss: 0.44890 - acc: 0.8052 -- iter: 07424/24500


Training Step: 1649  | total loss: 

0.44749

 | time: 28.670s


| Adam | epoch: 005 | loss: 0.44749 - acc: 0.8028 -- iter: 07488/24500


Training Step: 1650  | total loss: 

0.45547

 | time: 28.930s


| Adam | epoch: 005 | loss: 0.45547 - acc: 0.8006 -- iter: 07552/24500


Training Step: 1651  | total loss: 

0.44841

 | time: 29.184s


| Adam | epoch: 005 | loss: 0.44841 - acc: 0.8002 -- iter: 07616/24500


Training Step: 1652  | total loss: 

0.44914

 | time: 29.440s


| Adam | epoch: 005 | loss: 0.44914 - acc: 0.7968 -- iter: 07680/24500


Training Step: 1653  | total loss: 

0.44561

 | time: 29.697s


| Adam | epoch: 005 | loss: 0.44561 - acc: 0.7952 -- iter: 07744/24500


Training Step: 1654  | total loss: 

0.44145

 | time: 29.953s


| Adam | epoch: 005 | loss: 0.44145 - acc: 0.7938 -- iter: 07808/24500


Training Step: 1655  | total loss: 

0.43360

 | time: 30.203s


| Adam | epoch: 005 | loss: 0.43360 - acc: 0.8004 -- iter: 07872/24500


Training Step: 1656  | total loss: 

0.44044

 | time: 30.452s


| Adam | epoch: 005 | loss: 0.44044 - acc: 0.7969 -- iter: 07936/24500


Training Step: 1657  | total loss: 

0.43828

 | time: 30.686s


| Adam | epoch: 005 | loss: 0.43828 - acc: 0.8000 -- iter: 08000/24500


Training Step: 1658  | total loss: 

0.43869

 | time: 30.940s


| Adam | epoch: 005 | loss: 0.43869 - acc: 0.8044 -- iter: 08064/24500


Training Step: 1659  | total loss: 

0.43123

 | time: 31.178s


| Adam | epoch: 005 | loss: 0.43123 - acc: 0.8130 -- iter: 08128/24500


Training Step: 1660  | total loss: 

0.43960

 | time: 31.421s


| Adam | epoch: 005 | loss: 0.43960 - acc: 0.8083 -- iter: 08192/24500


Training Step: 1661  | total loss: 

0.43670

 | time: 31.665s


| Adam | epoch: 005 | loss: 0.43670 - acc: 0.8025 -- iter: 08256/24500


Training Step: 1662  | total loss: 

0.43978

 | time: 31.915s


| Adam | epoch: 005 | loss: 0.43978 - acc: 0.8019 -- iter: 08320/24500


Training Step: 1663  | total loss: 

0.44363

 | time: 32.162s


| Adam | epoch: 005 | loss: 0.44363 - acc: 0.7983 -- iter: 08384/24500


Training Step: 1664  | total loss: 

0.44970

 | time: 32.405s


| Adam | epoch: 005 | loss: 0.44970 - acc: 0.7919 -- iter: 08448/24500


Training Step: 1665  | total loss: 

0.45200

 | time: 32.652s


| Adam | epoch: 005 | loss: 0.45200 - acc: 0.7939 -- iter: 08512/24500


Training Step: 1666  | total loss: 

0.45693

 | time: 32.892s


| Adam | epoch: 005 | loss: 0.45693 - acc: 0.7895 -- iter: 08576/24500


Training Step: 1667  | total loss: 

0.45849

 | time: 33.134s


| Adam | epoch: 005 | loss: 0.45849 - acc: 0.7872 -- iter: 08640/24500


Training Step: 1668  | total loss: 

0.46138

 | time: 33.375s


| Adam | epoch: 005 | loss: 0.46138 - acc: 0.7881 -- iter: 08704/24500


Training Step: 1669  | total loss: 

0.46521

 | time: 33.610s


| Adam | epoch: 005 | loss: 0.46521 - acc: 0.7890 -- iter: 08768/24500


Training Step: 1670  | total loss: 

0.45901

 | time: 33.852s


| Adam | epoch: 005 | loss: 0.45901 - acc: 0.7851 -- iter: 08832/24500


Training Step: 1671  | total loss: 

0.44976

 | time: 34.093s


| Adam | epoch: 005 | loss: 0.44976 - acc: 0.7894 -- iter: 08896/24500


Training Step: 1672  | total loss: 

0.45653

 | time: 34.338s


| Adam | epoch: 005 | loss: 0.45653 - acc: 0.7870 -- iter: 08960/24500


Training Step: 1673  | total loss: 

0.45958

 | time: 34.583s


| Adam | epoch: 005 | loss: 0.45958 - acc: 0.7864 -- iter: 09024/24500


Training Step: 1674  | total loss: 

0.45750

 | time: 34.834s


| Adam | epoch: 005 | loss: 0.45750 - acc: 0.7859 -- iter: 09088/24500


Training Step: 1675  | total loss: 

0.45693

 | time: 35.080s


| Adam | epoch: 005 | loss: 0.45693 - acc: 0.7839 -- iter: 09152/24500


Training Step: 1676  | total loss: 

0.45288

 | time: 35.318s


| Adam | epoch: 005 | loss: 0.45288 - acc: 0.7899 -- iter: 09216/24500


Training Step: 1677  | total loss: 

0.45684

 | time: 35.554s


| Adam | epoch: 005 | loss: 0.45684 - acc: 0.7859 -- iter: 09280/24500


Training Step: 1678  | total loss: 

0.44952

 | time: 35.795s


| Adam | epoch: 005 | loss: 0.44952 - acc: 0.7932 -- iter: 09344/24500


Training Step: 1679  | total loss: 

0.46714

 | time: 36.027s


| Adam | epoch: 005 | loss: 0.46714 - acc: 0.7827 -- iter: 09408/24500


Training Step: 1680  | total loss: 

0.46504

 | time: 36.264s


| Adam | epoch: 005 | loss: 0.46504 - acc: 0.7794 -- iter: 09472/24500


Training Step: 1681  | total loss: 

0.46367

 | time: 36.507s


| Adam | epoch: 005 | loss: 0.46367 - acc: 0.7765 -- iter: 09536/24500


Training Step: 1682  | total loss: 

0.45019

 | time: 36.764s


| Adam | epoch: 005 | loss: 0.45019 - acc: 0.7863 -- iter: 09600/24500


Training Step: 1683  | total loss: 

0.44844

 | time: 37.015s


| Adam | epoch: 005 | loss: 0.44844 - acc: 0.7905 -- iter: 09664/24500


Training Step: 1684  | total loss: 

0.44528

 | time: 37.241s


| Adam | epoch: 005 | loss: 0.44528 - acc: 0.7896 -- iter: 09728/24500


Training Step: 1685  | total loss: 

0.43227

 | time: 37.482s


| Adam | epoch: 005 | loss: 0.43227 - acc: 0.7981 -- iter: 09792/24500


Training Step: 1686  | total loss: 

0.42329

 | time: 37.737s


| Adam | epoch: 005 | loss: 0.42329 - acc: 0.8058 -- iter: 09856/24500


Training Step: 1687  | total loss: 

0.44277

 | time: 37.985s


| Adam | epoch: 005 | loss: 0.44277 - acc: 0.7955 -- iter: 09920/24500


Training Step: 1688  | total loss: 

0.43722

 | time: 38.223s


| Adam | epoch: 005 | loss: 0.43722 - acc: 0.8035 -- iter: 09984/24500


Training Step: 1689  | total loss: 

0.46151

 | time: 38.469s


| Adam | epoch: 005 | loss: 0.46151 - acc: 0.7934 -- iter: 10048/24500


Training Step: 1690  | total loss: 

0.46473

 | time: 38.714s


| Adam | epoch: 005 | loss: 0.46473 - acc: 0.7797 -- iter: 10112/24500


Training Step: 1691  | total loss: 

0.47493

 | time: 38.961s


| Adam | epoch: 005 | loss: 0.47493 - acc: 0.7783 -- iter: 10176/24500


Training Step: 1692  | total loss: 

0.47646

 | time: 39.215s


| Adam | epoch: 005 | loss: 0.47646 - acc: 0.7817 -- iter: 10240/24500


Training Step: 1693  | total loss: 

0.47403

 | time: 39.456s


| Adam | epoch: 005 | loss: 0.47403 - acc: 0.7848 -- iter: 10304/24500


Training Step: 1694  | total loss: 

0.45884

 | time: 39.706s


| Adam | epoch: 005 | loss: 0.45884 - acc: 0.7970 -- iter: 10368/24500


Training Step: 1695  | total loss: 

0.45521

 | time: 39.952s


| Adam | epoch: 005 | loss: 0.45521 - acc: 0.8001 -- iter: 10432/24500


Training Step: 1696  | total loss: 

0.47230

 | time: 40.194s


| Adam | epoch: 005 | loss: 0.47230 - acc: 0.7873 -- iter: 10496/24500


Training Step: 1697  | total loss: 

0.46901

 | time: 40.429s


| Adam | epoch: 005 | loss: 0.46901 - acc: 0.7882 -- iter: 10560/24500


Training Step: 1698  | total loss: 

0.46312

 | time: 40.666s


| Adam | epoch: 005 | loss: 0.46312 - acc: 0.7922 -- iter: 10624/24500


Training Step: 1699  | total loss: 

0.47033

 | time: 40.916s


| Adam | epoch: 005 | loss: 0.47033 - acc: 0.7833 -- iter: 10688/24500


Training Step: 1700  | total loss: 

0.47082

 | time: 41.157s


| Adam | epoch: 005 | loss: 0.47082 - acc: 0.7862 -- iter: 10752/24500


Training Step: 1701  | total loss: 

0.46793

 | time: 41.395s


| Adam | epoch: 005 | loss: 0.46793 - acc: 0.7920 -- iter: 10816/24500


Training Step: 1702  | total loss: 

0.47200

 | time: 41.639s


| Adam | epoch: 005 | loss: 0.47200 - acc: 0.7862 -- iter: 10880/24500


Training Step: 1703  | total loss: 

0.48774

 | time: 41.882s


| Adam | epoch: 005 | loss: 0.48774 - acc: 0.7732 -- iter: 10944/24500


Training Step: 1704  | total loss: 

0.48565

 | time: 42.118s


| Adam | epoch: 005 | loss: 0.48565 - acc: 0.7740 -- iter: 11008/24500


Training Step: 1705  | total loss: 

0.48681

 | time: 42.358s


| Adam | epoch: 005 | loss: 0.48681 - acc: 0.7732 -- iter: 11072/24500


Training Step: 1706  | total loss: 

0.48287

 | time: 42.607s


| Adam | epoch: 005 | loss: 0.48287 - acc: 0.7787 -- iter: 11136/24500


Training Step: 1707  | total loss: 

0.47702

 | time: 42.857s


| Adam | epoch: 005 | loss: 0.47702 - acc: 0.7867 -- iter: 11200/24500


Training Step: 1708  | total loss: 

0.48094

 | time: 43.110s


| Adam | epoch: 005 | loss: 0.48094 - acc: 0.7799 -- iter: 11264/24500


Training Step: 1709  | total loss: 

0.47891

 | time: 43.354s


| Adam | epoch: 005 | loss: 0.47891 - acc: 0.7848 -- iter: 11328/24500


Training Step: 1710  | total loss: 

0.47832

 | time: 43.606s


| Adam | epoch: 005 | loss: 0.47832 - acc: 0.7844 -- iter: 11392/24500


Training Step: 1711  | total loss: 

0.47337

 | time: 43.857s


| Adam | epoch: 005 | loss: 0.47337 - acc: 0.7888 -- iter: 11456/24500


Training Step: 1712  | total loss: 

0.46920

 | time: 44.096s


| Adam | epoch: 005 | loss: 0.46920 - acc: 0.7958 -- iter: 11520/24500


Training Step: 1713  | total loss: 

0.45635

 | time: 44.347s


| Adam | epoch: 005 | loss: 0.45635 - acc: 0.8038 -- iter: 11584/24500


Training Step: 1714  | total loss: 

0.45788

 | time: 44.590s


| Adam | epoch: 005 | loss: 0.45788 - acc: 0.8046 -- iter: 11648/24500


Training Step: 1715  | total loss: 

0.46222

 | time: 44.832s


| Adam | epoch: 005 | loss: 0.46222 - acc: 0.7960 -- iter: 11712/24500


Training Step: 1716  | total loss: 

0.46789

 | time: 45.085s


| Adam | epoch: 005 | loss: 0.46789 - acc: 0.7899 -- iter: 11776/24500


Training Step: 1717  | total loss: 

0.49590

 | time: 45.326s


| Adam | epoch: 005 | loss: 0.49590 - acc: 0.7765 -- iter: 11840/24500


Training Step: 1718  | total loss: 

0.48874

 | time: 45.563s


| Adam | epoch: 005 | loss: 0.48874 - acc: 0.7707 -- iter: 11904/24500


Training Step: 1719  | total loss: 

0.48389

 | time: 45.810s


| Adam | epoch: 005 | loss: 0.48389 - acc: 0.7687 -- iter: 11968/24500


Training Step: 1720  | total loss: 

0.47532

 | time: 46.053s


| Adam | epoch: 005 | loss: 0.47532 - acc: 0.7730 -- iter: 12032/24500


Training Step: 1721  | total loss: 

0.47518

 | time: 46.302s


| Adam | epoch: 005 | loss: 0.47518 - acc: 0.7754 -- iter: 12096/24500


Training Step: 1722  | total loss: 

0.46469

 | time: 46.534s


| Adam | epoch: 005 | loss: 0.46469 - acc: 0.7823 -- iter: 12160/24500


Training Step: 1723  | total loss: 

0.47172

 | time: 46.780s


| Adam | epoch: 005 | loss: 0.47172 - acc: 0.7790 -- iter: 12224/24500


Training Step: 1724  | total loss: 

0.46685

 | time: 47.030s


| Adam | epoch: 005 | loss: 0.46685 - acc: 0.7793 -- iter: 12288/24500


Training Step: 1725  | total loss: 

0.46824

 | time: 47.271s


| Adam | epoch: 005 | loss: 0.46824 - acc: 0.7810 -- iter: 12352/24500


Training Step: 1726  | total loss: 

0.47542

 | time: 47.514s


| Adam | epoch: 005 | loss: 0.47542 - acc: 0.7810 -- iter: 12416/24500


Training Step: 1727  | total loss: 

0.46436

 | time: 47.758s


| Adam | epoch: 005 | loss: 0.46436 - acc: 0.7826 -- iter: 12480/24500


Training Step: 1728  | total loss: 

0.46553

 | time: 47.997s


| Adam | epoch: 005 | loss: 0.46553 - acc: 0.7841 -- iter: 12544/24500


Training Step: 1729  | total loss: 

0.46641

 | time: 48.245s


| Adam | epoch: 005 | loss: 0.46641 - acc: 0.7853 -- iter: 12608/24500


Training Step: 1730  | total loss: 

0.47074

 | time: 48.477s


| Adam | epoch: 005 | loss: 0.47074 - acc: 0.7849 -- iter: 12672/24500


Training Step: 1731  | total loss: 

0.48516

 | time: 48.719s


| Adam | epoch: 005 | loss: 0.48516 - acc: 0.7799 -- iter: 12736/24500


Training Step: 1732  | total loss: 

0.48855

 | time: 48.963s


| Adam | epoch: 005 | loss: 0.48855 - acc: 0.7722 -- iter: 12800/24500


Training Step: 1733  | total loss: 

0.48449

 | time: 49.219s


| Adam | epoch: 005 | loss: 0.48449 - acc: 0.7747 -- iter: 12864/24500


Training Step: 1734  | total loss: 

0.48948

 | time: 49.447s


| Adam | epoch: 005 | loss: 0.48948 - acc: 0.7644 -- iter: 12928/24500


Training Step: 1735  | total loss: 

0.49240

 | time: 49.691s


| Adam | epoch: 005 | loss: 0.49240 - acc: 0.7567 -- iter: 12992/24500


Training Step: 1736  | total loss: 

0.49005

 | time: 49.935s


| Adam | epoch: 005 | loss: 0.49005 - acc: 0.7576 -- iter: 13056/24500


Training Step: 1737  | total loss: 

0.48483

 | time: 50.174s


| Adam | epoch: 005 | loss: 0.48483 - acc: 0.7662 -- iter: 13120/24500


Training Step: 1738  | total loss: 

0.49219

 | time: 50.415s


| Adam | epoch: 005 | loss: 0.49219 - acc: 0.7552 -- iter: 13184/24500


Training Step: 1739  | total loss: 

0.48722

 | time: 50.660s


| Adam | epoch: 005 | loss: 0.48722 - acc: 0.7578 -- iter: 13248/24500


Training Step: 1740  | total loss: 

0.48552

 | time: 50.919s


| Adam | epoch: 005 | loss: 0.48552 - acc: 0.7523 -- iter: 13312/24500


Training Step: 1741  | total loss: 

0.47570

 | time: 51.163s


| Adam | epoch: 005 | loss: 0.47570 - acc: 0.7568 -- iter: 13376/24500


Training Step: 1742  | total loss: 

0.46967

 | time: 51.409s


| Adam | epoch: 005 | loss: 0.46967 - acc: 0.7655 -- iter: 13440/24500


Training Step: 1743  | total loss: 

0.47257

 | time: 51.646s


| Adam | epoch: 005 | loss: 0.47257 - acc: 0.7671 -- iter: 13504/24500


Training Step: 1744  | total loss: 

0.45790

 | time: 51.896s


| Adam | epoch: 005 | loss: 0.45790 - acc: 0.7857 -- iter: 13568/24500


Training Step: 1745  | total loss: 

0.44391

 | time: 52.133s


| Adam | epoch: 005 | loss: 0.44391 - acc: 0.7946 -- iter: 13632/24500


Training Step: 1746  | total loss: 

0.44025

 | time: 52.382s


| Adam | epoch: 005 | loss: 0.44025 - acc: 0.7995 -- iter: 13696/24500


Training Step: 1747  | total loss: 

0.43598

 | time: 52.627s


| Adam | epoch: 005 | loss: 0.43598 - acc: 0.7977 -- iter: 13760/24500


Training Step: 1748  | total loss: 

0.43639

 | time: 52.869s


| Adam | epoch: 005 | loss: 0.43639 - acc: 0.7914 -- iter: 13824/24500


Training Step: 1749  | total loss: 

0.43108

 | time: 53.119s


| Adam | epoch: 005 | loss: 0.43108 - acc: 0.7950 -- iter: 13888/24500


Training Step: 1750  | total loss: 

0.44994

 | time: 53.357s


| Adam | epoch: 005 | loss: 0.44994 - acc: 0.7858 -- iter: 13952/24500


Training Step: 1751  | total loss: 

0.45522

 | time: 53.589s


| Adam | epoch: 005 | loss: 0.45522 - acc: 0.7854 -- iter: 14016/24500


Training Step: 1752  | total loss: 

0.46904

 | time: 53.828s


| Adam | epoch: 005 | loss: 0.46904 - acc: 0.7850 -- iter: 14080/24500


Training Step: 1753  | total loss: 

0.45979

 | time: 54.096s


| Adam | epoch: 005 | loss: 0.45979 - acc: 0.7877 -- iter: 14144/24500


Training Step: 1754  | total loss: 

0.46703

 | time: 54.336s


| Adam | epoch: 005 | loss: 0.46703 - acc: 0.7824 -- iter: 14208/24500


Training Step: 1755  | total loss: 

0.46135

 | time: 54.569s


| Adam | epoch: 005 | loss: 0.46135 - acc: 0.7838 -- iter: 14272/24500


Training Step: 1756  | total loss: 

0.46196

 | time: 54.818s


| Adam | epoch: 005 | loss: 0.46196 - acc: 0.7851 -- iter: 14336/24500


Training Step: 1757  | total loss: 

0.45755

 | time: 55.071s


| Adam | epoch: 005 | loss: 0.45755 - acc: 0.7848 -- iter: 14400/24500


Training Step: 1758  | total loss: 

0.45624

 | time: 55.310s


| Adam | epoch: 005 | loss: 0.45624 - acc: 0.7860 -- iter: 14464/24500


Training Step: 1759  | total loss: 

0.45894

 | time: 55.557s


| Adam | epoch: 005 | loss: 0.45894 - acc: 0.7855 -- iter: 14528/24500


Training Step: 1760  | total loss: 

0.46807

 | time: 55.806s


| Adam | epoch: 005 | loss: 0.46807 - acc: 0.7773 -- iter: 14592/24500


Training Step: 1761  | total loss: 

0.46519

 | time: 56.042s


| Adam | epoch: 005 | loss: 0.46519 - acc: 0.7823 -- iter: 14656/24500


Training Step: 1762  | total loss: 

0.46288

 | time: 56.293s


| Adam | epoch: 005 | loss: 0.46288 - acc: 0.7854 -- iter: 14720/24500


Training Step: 1763  | total loss: 

0.45427

 | time: 56.533s


| Adam | epoch: 005 | loss: 0.45427 - acc: 0.7865 -- iter: 14784/24500


Training Step: 1764  | total loss: 

0.45213

 | time: 56.776s


| Adam | epoch: 005 | loss: 0.45213 - acc: 0.7875 -- iter: 14848/24500


Training Step: 1765  | total loss: 

0.46706

 | time: 57.020s


| Adam | epoch: 005 | loss: 0.46706 - acc: 0.7791 -- iter: 14912/24500


Training Step: 1766  | total loss: 

0.46002

 | time: 57.266s


| Adam | epoch: 005 | loss: 0.46002 - acc: 0.7840 -- iter: 14976/24500


Training Step: 1767  | total loss: 

0.45860

 | time: 57.516s


| Adam | epoch: 005 | loss: 0.45860 - acc: 0.7853 -- iter: 15040/24500


Training Step: 1768  | total loss: 

0.46162

 | time: 57.762s


| Adam | epoch: 005 | loss: 0.46162 - acc: 0.7833 -- iter: 15104/24500


Training Step: 1769  | total loss: 

0.46884

 | time: 58.008s


| Adam | epoch: 005 | loss: 0.46884 - acc: 0.7816 -- iter: 15168/24500


Training Step: 1770  | total loss: 

0.47458

 | time: 58.251s


| Adam | epoch: 005 | loss: 0.47458 - acc: 0.7768 -- iter: 15232/24500


Training Step: 1771  | total loss: 

0.46826

 | time: 58.499s


| Adam | epoch: 005 | loss: 0.46826 - acc: 0.7820 -- iter: 15296/24500


Training Step: 1772  | total loss: 

0.47320

 | time: 58.740s


| Adam | epoch: 005 | loss: 0.47320 - acc: 0.7835 -- iter: 15360/24500


Training Step: 1773  | total loss: 

0.46978

 | time: 58.982s


| Adam | epoch: 005 | loss: 0.46978 - acc: 0.7785 -- iter: 15424/24500


Training Step: 1774  | total loss: 

0.47954

 | time: 59.231s


| Adam | epoch: 005 | loss: 0.47954 - acc: 0.7773 -- iter: 15488/24500


Training Step: 1775  | total loss: 

0.48359

 | time: 59.465s


| Adam | epoch: 005 | loss: 0.48359 - acc: 0.7714 -- iter: 15552/24500


Training Step: 1776  | total loss: 

0.48592

 | time: 59.699s


| Adam | epoch: 005 | loss: 0.48592 - acc: 0.7740 -- iter: 15616/24500


Training Step: 1777  | total loss: 

0.48089

 | time: 59.938s


| Adam | epoch: 005 | loss: 0.48089 - acc: 0.7778 -- iter: 15680/24500


Training Step: 1778  | total loss: 

0.48116

 | time: 60.192s


| Adam | epoch: 005 | loss: 0.48116 - acc: 0.7766 -- iter: 15744/24500


Training Step: 1779  | total loss: 

0.47684

 | time: 60.436s


| Adam | epoch: 005 | loss: 0.47684 - acc: 0.7802 -- iter: 15808/24500


Training Step: 1780  | total loss: 

0.47186

 | time: 60.679s


| Adam | epoch: 005 | loss: 0.47186 - acc: 0.7834 -- iter: 15872/24500


Training Step: 1781  | total loss: 

0.46223

 | time: 60.922s


| Adam | epoch: 005 | loss: 0.46223 - acc: 0.7879 -- iter: 15936/24500


Training Step: 1782  | total loss: 

0.46351

 | time: 61.175s


| Adam | epoch: 005 | loss: 0.46351 - acc: 0.7825 -- iter: 16000/24500


Training Step: 1783  | total loss: 

0.47513

 | time: 61.417s


| Adam | epoch: 005 | loss: 0.47513 - acc: 0.7746 -- iter: 16064/24500


Training Step: 1784  | total loss: 

0.47134

 | time: 61.663s


| Adam | epoch: 005 | loss: 0.47134 - acc: 0.7753 -- iter: 16128/24500


Training Step: 1785  | total loss: 

0.47566

 | time: 61.899s


| Adam | epoch: 005 | loss: 0.47566 - acc: 0.7696 -- iter: 16192/24500


Training Step: 1786  | total loss: 

0.47462

 | time: 62.137s


| Adam | epoch: 005 | loss: 0.47462 - acc: 0.7630 -- iter: 16256/24500


Training Step: 1787  | total loss: 

0.46484

 | time: 62.376s


| Adam | epoch: 005 | loss: 0.46484 - acc: 0.7742 -- iter: 16320/24500


Training Step: 1788  | total loss: 

0.47018

 | time: 62.614s


| Adam | epoch: 005 | loss: 0.47018 - acc: 0.7686 -- iter: 16384/24500


Training Step: 1789  | total loss: 

0.46939

 | time: 62.854s


| Adam | epoch: 005 | loss: 0.46939 - acc: 0.7699 -- iter: 16448/24500


Training Step: 1790  | total loss: 

0.46751

 | time: 63.093s


| Adam | epoch: 005 | loss: 0.46751 - acc: 0.7726 -- iter: 16512/24500


Training Step: 1791  | total loss: 

0.45742

 | time: 63.336s


| Adam | epoch: 005 | loss: 0.45742 - acc: 0.7813 -- iter: 16576/24500


Training Step: 1792  | total loss: 

0.45531

 | time: 63.584s


| Adam | epoch: 005 | loss: 0.45531 - acc: 0.7797 -- iter: 16640/24500


Training Step: 1793  | total loss: 

0.45776

 | time: 63.824s


| Adam | epoch: 005 | loss: 0.45776 - acc: 0.7783 -- iter: 16704/24500


Training Step: 1794  | total loss: 

0.45517

 | time: 64.071s


| Adam | epoch: 005 | loss: 0.45517 - acc: 0.7801 -- iter: 16768/24500


Training Step: 1795  | total loss: 

0.45759

 | time: 64.324s


| Adam | epoch: 005 | loss: 0.45759 - acc: 0.7803 -- iter: 16832/24500


Training Step: 1796  | total loss: 

0.46236

 | time: 64.569s


| Adam | epoch: 005 | loss: 0.46236 - acc: 0.7819 -- iter: 16896/24500


Training Step: 1797  | total loss: 

0.46426

 | time: 64.814s


| Adam | epoch: 005 | loss: 0.46426 - acc: 0.7881 -- iter: 16960/24500


Training Step: 1798  | total loss: 

0.47616

 | time: 65.048s


| Adam | epoch: 005 | loss: 0.47616 - acc: 0.7812 -- iter: 17024/24500


Training Step: 1799  | total loss: 

0.46505

 | time: 65.301s


| Adam | epoch: 005 | loss: 0.46505 - acc: 0.7859 -- iter: 17088/24500


Training Step: 1800  | total loss: 

0.45724

 | time: 65.541s


| Adam | epoch: 005 | loss: 0.45724 - acc: 0.7917 -- iter: 17152/24500


Training Step: 1801  | total loss: 

0.46205

 | time: 65.789s


| Adam | epoch: 005 | loss: 0.46205 - acc: 0.7844 -- iter: 17216/24500


Training Step: 1802  | total loss: 

0.45829

 | time: 66.037s


| Adam | epoch: 005 | loss: 0.45829 - acc: 0.7856 -- iter: 17280/24500


Training Step: 1803  | total loss: 

0.45855

 | time: 66.279s


| Adam | epoch: 005 | loss: 0.45855 - acc: 0.7836 -- iter: 17344/24500


Training Step: 1804  | total loss: 

0.47674

 | time: 66.534s


| Adam | epoch: 005 | loss: 0.47674 - acc: 0.7803 -- iter: 17408/24500


Training Step: 1805  | total loss: 

0.47211

 | time: 66.780s


| Adam | epoch: 005 | loss: 0.47211 - acc: 0.7804 -- iter: 17472/24500


Training Step: 1806  | total loss: 

0.47332

 | time: 67.034s


| Adam | epoch: 005 | loss: 0.47332 - acc: 0.7789 -- iter: 17536/24500


Training Step: 1807  | total loss: 

0.45926

 | time: 67.281s


| Adam | epoch: 005 | loss: 0.45926 - acc: 0.7901 -- iter: 17600/24500


Training Step: 1808  | total loss: 

0.45463

 | time: 67.534s


| Adam | epoch: 005 | loss: 0.45463 - acc: 0.7907 -- iter: 17664/24500


Training Step: 1809  | total loss: 

0.45614

 | time: 67.776s


| Adam | epoch: 005 | loss: 0.45614 - acc: 0.7929 -- iter: 17728/24500


Training Step: 1810  | total loss: 

0.44384

 | time: 68.023s


| Adam | epoch: 005 | loss: 0.44384 - acc: 0.7996 -- iter: 17792/24500


Training Step: 1811  | total loss: 

0.44685

 | time: 68.268s


| Adam | epoch: 005 | loss: 0.44685 - acc: 0.7993 -- iter: 17856/24500


Training Step: 1812  | total loss: 

0.44376

 | time: 68.503s


| Adam | epoch: 005 | loss: 0.44376 - acc: 0.8037 -- iter: 17920/24500


Training Step: 1813  | total loss: 

0.44263

 | time: 68.760s


| Adam | epoch: 005 | loss: 0.44263 - acc: 0.8046 -- iter: 17984/24500


Training Step: 1814  | total loss: 

0.44261

 | time: 68.991s


| Adam | epoch: 005 | loss: 0.44261 - acc: 0.8007 -- iter: 18048/24500


Training Step: 1815  | total loss: 

0.44699

 | time: 69.232s


| Adam | epoch: 005 | loss: 0.44699 - acc: 0.8003 -- iter: 18112/24500


Training Step: 1816  | total loss: 

0.43890

 | time: 69.484s


| Adam | epoch: 005 | loss: 0.43890 - acc: 0.8031 -- iter: 18176/24500


Training Step: 1817  | total loss: 

0.42386

 | time: 69.721s


| Adam | epoch: 005 | loss: 0.42386 - acc: 0.8134 -- iter: 18240/24500


Training Step: 1818  | total loss: 

0.42871

 | time: 69.964s


| Adam | epoch: 005 | loss: 0.42871 - acc: 0.8149 -- iter: 18304/24500


Training Step: 1819  | total loss: 

0.44157

 | time: 70.193s


| Adam | epoch: 005 | loss: 0.44157 - acc: 0.8068 -- iter: 18368/24500


Training Step: 1820  | total loss: 

0.44266

 | time: 70.433s


| Adam | epoch: 005 | loss: 0.44266 - acc: 0.8058 -- iter: 18432/24500


Training Step: 1821  | total loss: 

0.44658

 | time: 70.678s


| Adam | epoch: 005 | loss: 0.44658 - acc: 0.8065 -- iter: 18496/24500


Training Step: 1822  | total loss: 

0.45278

 | time: 70.927s


| Adam | epoch: 005 | loss: 0.45278 - acc: 0.8040 -- iter: 18560/24500


Training Step: 1823  | total loss: 

0.44484

 | time: 71.170s


| Adam | epoch: 005 | loss: 0.44484 - acc: 0.8080 -- iter: 18624/24500


Training Step: 1824  | total loss: 

0.44406

 | time: 71.418s


| Adam | epoch: 005 | loss: 0.44406 - acc: 0.8084 -- iter: 18688/24500


Training Step: 1825  | total loss: 

0.44213

 | time: 71.665s


| Adam | epoch: 005 | loss: 0.44213 - acc: 0.8119 -- iter: 18752/24500


Training Step: 1826  | total loss: 

0.44585

 | time: 71.915s


| Adam | epoch: 005 | loss: 0.44585 - acc: 0.8073 -- iter: 18816/24500


Training Step: 1827  | total loss: 

0.45044

 | time: 72.141s


| Adam | epoch: 005 | loss: 0.45044 - acc: 0.8031 -- iter: 18880/24500


Training Step: 1828  | total loss: 

0.44781

 | time: 72.386s


| Adam | epoch: 005 | loss: 0.44781 - acc: 0.8010 -- iter: 18944/24500


Training Step: 1829  | total loss: 

0.44080

 | time: 72.625s


| Adam | epoch: 005 | loss: 0.44080 - acc: 0.8052 -- iter: 19008/24500


Training Step: 1830  | total loss: 

0.44330

 | time: 72.870s


| Adam | epoch: 005 | loss: 0.44330 - acc: 0.8028 -- iter: 19072/24500


Training Step: 1831  | total loss: 

0.45430

 | time: 73.107s


| Adam | epoch: 005 | loss: 0.45430 - acc: 0.7929 -- iter: 19136/24500


Training Step: 1832  | total loss: 

0.45283

 | time: 73.345s


| Adam | epoch: 005 | loss: 0.45283 - acc: 0.7964 -- iter: 19200/24500


Training Step: 1833  | total loss: 

0.45396

 | time: 73.599s


| Adam | epoch: 005 | loss: 0.45396 - acc: 0.7980 -- iter: 19264/24500


Training Step: 1834  | total loss: 

0.45924

 | time: 73.836s


| Adam | epoch: 005 | loss: 0.45924 - acc: 0.7901 -- iter: 19328/24500


Training Step: 1835  | total loss: 

0.45814

 | time: 74.076s


| Adam | epoch: 005 | loss: 0.45814 - acc: 0.7892 -- iter: 19392/24500


Training Step: 1836  | total loss: 

0.45653

 | time: 74.326s


| Adam | epoch: 005 | loss: 0.45653 - acc: 0.7900 -- iter: 19456/24500


Training Step: 1837  | total loss: 

0.44495

 | time: 74.573s


| Adam | epoch: 005 | loss: 0.44495 - acc: 0.7969 -- iter: 19520/24500


Training Step: 1838  | total loss: 

0.43961

 | time: 74.817s


| Adam | epoch: 005 | loss: 0.43961 - acc: 0.7985 -- iter: 19584/24500


Training Step: 1839  | total loss: 

0.43675

 | time: 75.065s


| Adam | epoch: 005 | loss: 0.43675 - acc: 0.8014 -- iter: 19648/24500


Training Step: 1840  | total loss: 

0.43445

 | time: 75.322s


| Adam | epoch: 005 | loss: 0.43445 - acc: 0.8041 -- iter: 19712/24500


Training Step: 1841  | total loss: 

0.43161

 | time: 75.557s


| Adam | epoch: 005 | loss: 0.43161 - acc: 0.8034 -- iter: 19776/24500


Training Step: 1842  | total loss: 

0.43374

 | time: 75.791s


| Adam | epoch: 005 | loss: 0.43374 - acc: 0.8043 -- iter: 19840/24500


Training Step: 1843  | total loss: 

0.43244

 | time: 76.036s


| Adam | epoch: 005 | loss: 0.43244 - acc: 0.8067 -- iter: 19904/24500


Training Step: 1844  | total loss: 

0.45318

 | time: 76.278s


| Adam | epoch: 005 | loss: 0.45318 - acc: 0.7932 -- iter: 19968/24500


Training Step: 1845  | total loss: 

0.45699

 | time: 76.528s


| Adam | epoch: 005 | loss: 0.45699 - acc: 0.7826 -- iter: 20032/24500


Training Step: 1846  | total loss: 

0.45668

 | time: 76.765s


| Adam | epoch: 005 | loss: 0.45668 - acc: 0.7825 -- iter: 20096/24500


Training Step: 1847  | total loss: 

0.47369

 | time: 77.008s


| Adam | epoch: 005 | loss: 0.47369 - acc: 0.7824 -- iter: 20160/24500


Training Step: 1848  | total loss: 

0.46514

 | time: 77.248s


| Adam | epoch: 005 | loss: 0.46514 - acc: 0.7885 -- iter: 20224/24500


Training Step: 1849  | total loss: 

0.47670

 | time: 77.491s


| Adam | epoch: 005 | loss: 0.47670 - acc: 0.7831 -- iter: 20288/24500


Training Step: 1850  | total loss: 

0.48910

 | time: 77.727s


| Adam | epoch: 005 | loss: 0.48910 - acc: 0.7735 -- iter: 20352/24500


Training Step: 1851  | total loss: 

0.50360

 | time: 77.964s


| Adam | epoch: 005 | loss: 0.50360 - acc: 0.7665 -- iter: 20416/24500


Training Step: 1852  | total loss: 

0.49569

 | time: 78.205s


| Adam | epoch: 005 | loss: 0.49569 - acc: 0.7711 -- iter: 20480/24500


Training Step: 1853  | total loss: 

0.48861

 | time: 78.456s


| Adam | epoch: 005 | loss: 0.48861 - acc: 0.7721 -- iter: 20544/24500


Training Step: 1854  | total loss: 

0.48031

 | time: 78.706s


| Adam | epoch: 005 | loss: 0.48031 - acc: 0.7746 -- iter: 20608/24500


Training Step: 1855  | total loss: 

0.48823

 | time: 78.952s


| Adam | epoch: 005 | loss: 0.48823 - acc: 0.7690 -- iter: 20672/24500


Training Step: 1856  | total loss: 

0.49446

 | time: 79.196s


| Adam | epoch: 005 | loss: 0.49446 - acc: 0.7640 -- iter: 20736/24500


Training Step: 1857  | total loss: 

0.48774

 | time: 79.442s


| Adam | epoch: 005 | loss: 0.48774 - acc: 0.7720 -- iter: 20800/24500


Training Step: 1858  | total loss: 

0.48121

 | time: 79.682s


| Adam | epoch: 005 | loss: 0.48121 - acc: 0.7729 -- iter: 20864/24500


Training Step: 1859  | total loss: 

0.47926

 | time: 79.926s


| Adam | epoch: 005 | loss: 0.47926 - acc: 0.7737 -- iter: 20928/24500


Training Step: 1860  | total loss: 

0.47992

 | time: 80.165s


| Adam | epoch: 005 | loss: 0.47992 - acc: 0.7760 -- iter: 20992/24500


Training Step: 1861  | total loss: 

0.47771

 | time: 80.420s


| Adam | epoch: 005 | loss: 0.47771 - acc: 0.7750 -- iter: 21056/24500


Training Step: 1862  | total loss: 

0.47650

 | time: 80.658s


| Adam | epoch: 005 | loss: 0.47650 - acc: 0.7725 -- iter: 21120/24500


Training Step: 1863  | total loss: 

0.46781

 | time: 80.896s


| Adam | epoch: 005 | loss: 0.46781 - acc: 0.7812 -- iter: 21184/24500


Training Step: 1864  | total loss: 

0.46305

 | time: 81.130s


| Adam | epoch: 005 | loss: 0.46305 - acc: 0.7890 -- iter: 21248/24500


Training Step: 1865  | total loss: 

0.45822

 | time: 81.378s


| Adam | epoch: 005 | loss: 0.45822 - acc: 0.7929 -- iter: 21312/24500


Training Step: 1866  | total loss: 

0.44867

 | time: 81.622s


| Adam | epoch: 005 | loss: 0.44867 - acc: 0.8027 -- iter: 21376/24500


Training Step: 1867  | total loss: 

0.43926

 | time: 81.869s


| Adam | epoch: 005 | loss: 0.43926 - acc: 0.8084 -- iter: 21440/24500


Training Step: 1868  | total loss: 

0.43827

 | time: 82.119s


| Adam | epoch: 005 | loss: 0.43827 - acc: 0.8056 -- iter: 21504/24500


Training Step: 1869  | total loss: 

0.44748

 | time: 82.356s


| Adam | epoch: 005 | loss: 0.44748 - acc: 0.8016 -- iter: 21568/24500


Training Step: 1870  | total loss: 

0.44906

 | time: 82.601s


| Adam | epoch: 005 | loss: 0.44906 - acc: 0.8027 -- iter: 21632/24500


Training Step: 1871  | total loss: 

0.44361

 | time: 82.844s


| Adam | epoch: 005 | loss: 0.44361 - acc: 0.8037 -- iter: 21696/24500


Training Step: 1872  | total loss: 

0.44502

 | time: 83.089s


| Adam | epoch: 005 | loss: 0.44502 - acc: 0.7983 -- iter: 21760/24500


Training Step: 1873  | total loss: 

0.45786

 | time: 83.330s


| Adam | epoch: 005 | loss: 0.45786 - acc: 0.7904 -- iter: 21824/24500


Training Step: 1874  | total loss: 

0.48606

 | time: 83.576s


| Adam | epoch: 005 | loss: 0.48606 - acc: 0.7832 -- iter: 21888/24500


Training Step: 1875  | total loss: 

0.48483

 | time: 83.825s


| Adam | epoch: 005 | loss: 0.48483 - acc: 0.7846 -- iter: 21952/24500


Training Step: 1876  | total loss: 

0.48320

 | time: 84.063s


| Adam | epoch: 005 | loss: 0.48320 - acc: 0.7858 -- iter: 22016/24500


Training Step: 1877  | total loss: 

0.50611

 | time: 84.303s


| Adam | epoch: 005 | loss: 0.50611 - acc: 0.7650 -- iter: 22080/24500


Training Step: 1878  | total loss: 

0.49635

 | time: 84.549s


| Adam | epoch: 005 | loss: 0.49635 - acc: 0.7682 -- iter: 22144/24500


Training Step: 1879  | total loss: 

0.49215

 | time: 84.798s


| Adam | epoch: 005 | loss: 0.49215 - acc: 0.7727 -- iter: 22208/24500


Training Step: 1880  | total loss: 

0.48209

 | time: 85.040s


| Adam | epoch: 005 | loss: 0.48209 - acc: 0.7813 -- iter: 22272/24500


Training Step: 1881  | total loss: 

0.48033

 | time: 85.281s


| Adam | epoch: 005 | loss: 0.48033 - acc: 0.7782 -- iter: 22336/24500


Training Step: 1882  | total loss: 

0.47457

 | time: 85.537s


| Adam | epoch: 005 | loss: 0.47457 - acc: 0.7863 -- iter: 22400/24500


Training Step: 1883  | total loss: 

0.47107

 | time: 85.781s


| Adam | epoch: 005 | loss: 0.47107 - acc: 0.7952 -- iter: 22464/24500


Training Step: 1884  | total loss: 

0.46722

 | time: 86.018s


| Adam | epoch: 005 | loss: 0.46722 - acc: 0.7953 -- iter: 22528/24500


Training Step: 1885  | total loss: 

0.46387

 | time: 86.262s


| Adam | epoch: 005 | loss: 0.46387 - acc: 0.8002 -- iter: 22592/24500


Training Step: 1886  | total loss: 

0.46336

 | time: 86.503s


| Adam | epoch: 005 | loss: 0.46336 - acc: 0.8030 -- iter: 22656/24500


Training Step: 1887  | total loss: 

0.46024

 | time: 86.751s


| Adam | epoch: 005 | loss: 0.46024 - acc: 0.7992 -- iter: 22720/24500


Training Step: 1888  | total loss: 

0.52590

 | time: 86.993s


| Adam | epoch: 005 | loss: 0.52590 - acc: 0.7693 -- iter: 22784/24500


Training Step: 1889  | total loss: 

0.50789

 | time: 87.238s


| Adam | epoch: 005 | loss: 0.50789 - acc: 0.7799 -- iter: 22848/24500


Training Step: 1890  | total loss: 

0.49846

 | time: 87.474s


| Adam | epoch: 005 | loss: 0.49846 - acc: 0.7832 -- iter: 22912/24500


Training Step: 1891  | total loss: 

0.49349

 | time: 87.722s


| Adam | epoch: 005 | loss: 0.49349 - acc: 0.7830 -- iter: 22976/24500


Training Step: 1892  | total loss: 

0.48099

 | time: 87.967s


| Adam | epoch: 005 | loss: 0.48099 - acc: 0.7875 -- iter: 23040/24500


Training Step: 1893  | total loss: 

0.48119

 | time: 88.203s


| Adam | epoch: 005 | loss: 0.48119 - acc: 0.7869 -- iter: 23104/24500


Training Step: 1894  | total loss: 

0.47601

 | time: 88.452s


| Adam | epoch: 005 | loss: 0.47601 - acc: 0.7894 -- iter: 23168/24500


Training Step: 1895  | total loss: 

0.46039

 | time: 88.694s


| Adam | epoch: 005 | loss: 0.46039 - acc: 0.7980 -- iter: 23232/24500


Training Step: 1896  | total loss: 

0.44673

 | time: 88.943s


| Adam | epoch: 005 | loss: 0.44673 - acc: 0.8057 -- iter: 23296/24500


Training Step: 1897  | total loss: 

0.44755

 | time: 89.188s


| Adam | epoch: 005 | loss: 0.44755 - acc: 0.8017 -- iter: 23360/24500


Training Step: 1898  | total loss: 

0.45161

 | time: 89.420s


| Adam | epoch: 005 | loss: 0.45161 - acc: 0.8012 -- iter: 23424/24500


Training Step: 1899  | total loss: 

0.44584

 | time: 89.664s


| Adam | epoch: 005 | loss: 0.44584 - acc: 0.8070 -- iter: 23488/24500


Training Step: 1900  | total loss: 

0.44089

 | time: 89.906s


| Adam | epoch: 005 | loss: 0.44089 - acc: 0.8091 -- iter: 23552/24500


Training Step: 1901  | total loss: 

0.43306

 | time: 90.149s


| Adam | epoch: 005 | loss: 0.43306 - acc: 0.8157 -- iter: 23616/24500


Training Step: 1902  | total loss: 

0.42165

 | time: 90.397s


| Adam | epoch: 005 | loss: 0.42165 - acc: 0.8170 -- iter: 23680/24500


Training Step: 1903  | total loss: 

0.42714

 | time: 90.645s


| Adam | epoch: 005 | loss: 0.42714 - acc: 0.8118 -- iter: 23744/24500


Training Step: 1904  | total loss: 

0.42407

 | time: 90.887s


| Adam | epoch: 005 | loss: 0.42407 - acc: 0.8166 -- iter: 23808/24500


Training Step: 1905  | total loss: 

0.43187

 | time: 91.132s


| Adam | epoch: 005 | loss: 0.43187 - acc: 0.8162 -- iter: 23872/24500


Training Step: 1906  | total loss: 

0.42290

 | time: 91.379s


| Adam | epoch: 005 | loss: 0.42290 - acc: 0.8205 -- iter: 23936/24500


Training Step: 1907  | total loss: 

0.42570

 | time: 91.622s


| Adam | epoch: 005 | loss: 0.42570 - acc: 0.8197 -- iter: 24000/24500


Training Step: 1908  | total loss: 

0.42377

 | time: 91.863s


| Adam | epoch: 005 | loss: 0.42377 - acc: 0.8205 -- iter: 24064/24500


Training Step: 1909  | total loss: 

0.41737

 | time: 92.103s


| Adam | epoch: 005 | loss: 0.41737 - acc: 0.8213 -- iter: 24128/24500


Training Step: 1910  | total loss: 

0.41759

 | time: 92.342s


| Adam | epoch: 005 | loss: 0.41759 - acc: 0.8204 -- iter: 24192/24500


Training Step: 1911  | total loss: 

0.43695

 | time: 92.586s


| Adam | epoch: 005 | loss: 0.43695 - acc: 0.8134 -- iter: 24256/24500


Training Step: 1912  | total loss: 

0.43739

 | time: 92.835s


| Adam | epoch: 005 | loss: 0.43739 - acc: 0.8055 -- iter: 24320/24500


Training Step: 1913  | total loss: 

0.43505

 | time: 93.073s


| Adam | epoch: 005 | loss: 0.43505 - acc: 0.8030 -- iter: 24384/24500


Training Step: 1914  | total loss: 

0.43297

 | time: 93.314s


| Adam | epoch: 005 | loss: 0.43297 - acc: 0.8056 -- iter: 24448/24500


Training Step: 1915  | total loss: 

0.42679

 | time: 94.568s


| Adam | epoch: 005 | loss: 0.42679 - acc: 0.8078 | val_loss: 0.48608 - val_acc: 0.7760 -- iter: 24500/24500
--


INFO:tensorflow:C:\Users\modak\Anaconda3\TensorFlow_test\dogs-vs-cats-4-layer-covnet is not in all_model_checkpoint_paths. Manually adding it.




In [8]:
import matplotlib.pyplot as plt

In [9]:
fig=plt.figure(figsize=(16, 16))

for num, data in enumerate(test_data[50:75]):
    img_num = data[1]
    img_data = data[0]

    y = fig.add_subplot(5, 5, num+1)
    orig = img_data
    data = img_data.reshape(IMG_SIZE, IMG_SIZE, 1)
    model_out = model.predict([data])[0]

    if np.argmax(model_out) == 1:
        str_label='Dog'
    else:
        str_label='Cat'

    y.imshow(orig, cmap='gray')
    plt.title(str_label)
    y.axes.get_xaxis().set_visible(False)
    y.axes.get_yaxis().set_visible(False)
# plt.show()
plt.savefig('%s-test-25.png' % MODEL_NAME)



NameError: name 'test_data' is not defined

<matplotlib.figure.Figure at 0x2257f67d940>