In [1]:
import matplotlib as mpl
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import sklearn
import pandas as pd
import os
import sys
import time
import tensorflow as tf

from tensorflow import keras

print(tf.__version__)
print(sys.version_info)
for module in mpl,np,pd,sklearn,tf,keras:
    print(module.__name__,module.__version__)

tf.test.is_gpu_available()

  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])


1.13.1
sys.version_info(major=3, minor=7, micro=4, releaselevel='final', serial=0)
matplotlib 3.1.2
numpy 1.18.1
pandas 0.25.3
sklearn 0.22.1
tensorflow 1.13.1
tensorflow._api.v1.keras 2.2.4-tf


False

In [2]:
fashion_mnist = keras.datasets.fashion_mnist
(x_train_all,y_train_all),(x_test, y_test) = fashion_mnist.load_data()
x_valid,x_train = x_train_all[:5000],x_train_all[5000:]
y_valid,y_train = y_train_all[:5000],y_train_all[5000:]

print(x_train.shape,y_train.shape)
print(x_valid.shape,y_valid.shape)
print(x_test.shape,y_test.shape)
print(np.max(x_train),np.min(x_train))

# 这里对label数据类型进行更改，
y_train = np.asarray(y_train,dtype = np.int64)
y_valid = np.asarray(y_valid,dtype = np.int64)
y_test = np.asarray(y_test,dtype = np.int64)

(55000, 28, 28) (55000,)
(5000, 28, 28) (5000,)
(10000, 28, 28) (10000,)
255 0


In [3]:
from sklearn.preprocessing import StandardScaler

scaler = StandardScaler()
# x_train:[None,28,28] -> [None,784]
x_train_scaled = scaler.fit_transform(
    x_train.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
x_valid_scaled = scaler.fit_transform(
    x_valid.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
x_test_scaled = scaler.fit_transform(
    x_test.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
print(np.max(x_train_scaled),np.min(x_train_scaled))

2.0231433 -0.8105136


In [4]:
def make_dataset(images,labels,epochs,batch_size,shuffle = True):
    dataset = tf.data.Dataset.from_tensor_slices((images,labels))
    if shuffle:
        dataset.shuffle(10000)
    dataset = dataset.repeat(epochs).batch(batch_size)
    return dataset

In [5]:
# 我们并不能像在2.0中那样通过eager模式来访问dataset
epochs = 10
batch_size = 20
dataset = make_dataset(x_train_scaled,y_train,
                       epochs = epochs,
                       batch_size = batch_size)
for data, label in dataset.take(1):
    print(data)
    print(label)

RuntimeError: dataset.__iter__() is only supported when eager execution is enabled.

In [10]:
# 那么要怎样才能在1.0中访问dataset呢
epochs = 10
batch_size = 20
dataset = make_dataset(x_train_scaled,y_train,
                       epochs = epochs,
                       batch_size = batch_size)
# 首先需要创建dataset_iter
# make_one_shot_iterator有下面这些特点:
# 1、自动初始化
# 2、不能被重新初始化；(make_initializable_iterator是可以重新被初始化的)
dataset_iter = dataset.make_one_shot_iterator()
x,y = dataset_iter.get_next() # 取出tensor
# 创建session来访问
with tf.Session() as sess:
    x_val,y_val = sess.run([x,y])
    print(x_val.shape)
    print(y_val.shape)

(20, 784)
(20,)


In [11]:
# 构建模型
hidden_units = [100,100]
class_num = 10 # 10分类

input_for_next_layer = x
# 隐藏层
for hidden_unit in hidden_units:
    input_for_next_layer = tf.layers.dense(input_for_next_layer,
                                           hidden_unit,
                                           activation=tf.nn.relu)
# 输出层
logits = tf.layers.dense(input_for_next_layer,
                         class_num)

# loss计算
# 1. 将最后一层的输出做softmax计算出prob(每种分类的概率)
# 2. labels -> one_hot 将标签进行one-hot编码
# 3. 计算loss：就是去概率最大的那个max_prob进行-log(max_prob)的计算
loss = tf.losses.sparse_softmax_cross_entropy(labels = y,
                                              logits = logits)

# 计算正确率accuracy
# 取出概率最大的那个位置的索引位置作为预测
prediction = tf.argmax(logits, 1)
correct_prediction = tf.equal(prediction,y) # 正确的为1，错误的为0
# 先将int值转为float类型然后在进行正确率的计算
accuracy = tf.reduce_mean(tf.cast(correct_prediction,tf.float64)) 

# 定义train_op,在训练的时候就是调用train_op
train_op = tf.train.AdamOptimizer(1e-3).minimize(loss)

In [12]:
print(x)
print(logits)

Tensor("IteratorGetNext_1:0", shape=(?, 784), dtype=float32)
Tensor("dense_5/BiasAdd:0", shape=(?, 10), dtype=float32)


In [13]:
# 模型训练
init = tf.global_variables_initializer()
train_steps_per_epoch = x_train_scaled.shape[0] // batch_size

with tf.Session() as sess:
    sess.run(init)
    for epoch in range(epochs):
        for step in range(train_steps_per_epoch):
            loss_val,accuracy_val,_ = sess.run(
                [loss,accuracy,train_op])
            print("\r[Train] epoch: %d, step: %d, loss: %3.5f, accuracy: %2.2f" % 
                  (epoch,step,loss_val,accuracy_val),end=" ")

[Train] epoch: 0, step: 0, loss: 2.68249, accuracy: 0.00 [Train] epoch: 0, step: 1, loss: 2.14046, accuracy: 0.20 [Train] epoch: 0, step: 2, loss: 2.00104, accuracy: 0.40 [Train] epoch: 0, step: 3, loss: 1.92572, accuracy: 0.25 [Train] epoch: 0, step: 4, loss: 1.71350, accuracy: 0.25 [Train] epoch: 0, step: 5, loss: 1.50608, accuracy: 0.50 [Train] epoch: 0, step: 6, loss: 1.81894, accuracy: 0.30 [Train] epoch: 0, step: 7, loss: 1.76569, accuracy: 0.45 [Train] epoch: 0, step: 8, loss: 1.22639, accuracy: 0.70 [Train] epoch: 0, step: 9, loss: 1.43902, accuracy: 0.60 [Train] epoch: 0, step: 10, loss: 1.26270, accuracy: 0.65 [Train] epoch: 0, step: 11, loss: 1.06961, accuracy: 0.75 [Train] epoch: 0, step: 12, loss: 1.89877, accuracy: 0.35 [Train] epoch: 0, step: 13, loss: 1.10769, accuracy: 0.55 [Train] epoch: 0, step: 14, loss: 1.38562, accuracy: 0.45 [Train] epoch: 0, step: 15, loss: 0.78346, accuracy: 0.80 [Train] epoch: 0, step: 16, loss: 0.91062, accuracy: 0.70 [Train

[Train] epoch: 0, step: 316, loss: 0.07467, accuracy: 1.00 [Train] epoch: 0, step: 317, loss: 0.28362, accuracy: 0.90 [Train] epoch: 0, step: 318, loss: 0.63038, accuracy: 0.80 [Train] epoch: 0, step: 319, loss: 0.68940, accuracy: 0.70 [Train] epoch: 0, step: 320, loss: 0.57343, accuracy: 0.75 [Train] epoch: 0, step: 321, loss: 0.68528, accuracy: 0.70 [Train] epoch: 0, step: 322, loss: 0.89144, accuracy: 0.60 [Train] epoch: 0, step: 323, loss: 0.55057, accuracy: 0.85 [Train] epoch: 0, step: 324, loss: 0.16495, accuracy: 0.95 [Train] epoch: 0, step: 325, loss: 0.36146, accuracy: 0.85 [Train] epoch: 0, step: 326, loss: 1.01198, accuracy: 0.65 [Train] epoch: 0, step: 327, loss: 0.82733, accuracy: 0.65 [Train] epoch: 0, step: 328, loss: 0.55182, accuracy: 0.65 [Train] epoch: 0, step: 329, loss: 0.87606, accuracy: 0.85 [Train] epoch: 0, step: 330, loss: 0.52761, accuracy: 0.70 [Train] epoch: 0, step: 331, loss: 0.36959, accuracy: 0.90 [Train] epoch: 0, step: 332, loss: 0.59

[Train] epoch: 0, step: 637, loss: 0.69590, accuracy: 0.75 [Train] epoch: 0, step: 638, loss: 0.44487, accuracy: 0.80 [Train] epoch: 0, step: 639, loss: 0.41258, accuracy: 0.90 [Train] epoch: 0, step: 640, loss: 0.66530, accuracy: 0.70 [Train] epoch: 0, step: 641, loss: 0.43515, accuracy: 0.80 [Train] epoch: 0, step: 642, loss: 0.20850, accuracy: 1.00 [Train] epoch: 0, step: 643, loss: 0.54979, accuracy: 0.80 [Train] epoch: 0, step: 644, loss: 0.58805, accuracy: 0.80 [Train] epoch: 0, step: 645, loss: 0.47404, accuracy: 0.85 [Train] epoch: 0, step: 646, loss: 0.57674, accuracy: 0.85 [Train] epoch: 0, step: 647, loss: 0.57408, accuracy: 0.85 [Train] epoch: 0, step: 648, loss: 0.30585, accuracy: 0.90 [Train] epoch: 0, step: 649, loss: 0.81333, accuracy: 0.80 [Train] epoch: 0, step: 650, loss: 0.97574, accuracy: 0.65 [Train] epoch: 0, step: 651, loss: 0.15720, accuracy: 0.95 [Train] epoch: 0, step: 652, loss: 0.84768, accuracy: 0.75 [Train] epoch: 0, step: 653, loss: 0.64

[Train] epoch: 0, step: 952, loss: 0.99301, accuracy: 0.70 [Train] epoch: 0, step: 953, loss: 0.31341, accuracy: 0.85 [Train] epoch: 0, step: 954, loss: 0.55574, accuracy: 0.75 [Train] epoch: 0, step: 955, loss: 0.53846, accuracy: 0.85 [Train] epoch: 0, step: 956, loss: 0.28192, accuracy: 0.90 [Train] epoch: 0, step: 957, loss: 0.48218, accuracy: 0.85 [Train] epoch: 0, step: 958, loss: 0.25230, accuracy: 0.90 [Train] epoch: 0, step: 959, loss: 0.66163, accuracy: 0.70 [Train] epoch: 0, step: 960, loss: 0.33265, accuracy: 0.90 [Train] epoch: 0, step: 961, loss: 0.37393, accuracy: 0.80 [Train] epoch: 0, step: 962, loss: 0.41548, accuracy: 0.90 [Train] epoch: 0, step: 963, loss: 0.53683, accuracy: 0.80 [Train] epoch: 0, step: 964, loss: 0.58037, accuracy: 0.70 [Train] epoch: 0, step: 965, loss: 0.49161, accuracy: 0.80 [Train] epoch: 0, step: 966, loss: 0.57950, accuracy: 0.85 [Train] epoch: 0, step: 967, loss: 0.65849, accuracy: 0.85 [Train] epoch: 0, step: 968, loss: 0.54

[Train] epoch: 0, step: 1261, loss: 0.43043, accuracy: 0.80 [Train] epoch: 0, step: 1262, loss: 0.54700, accuracy: 0.75 [Train] epoch: 0, step: 1263, loss: 0.32990, accuracy: 0.80 [Train] epoch: 0, step: 1264, loss: 0.38675, accuracy: 0.85 [Train] epoch: 0, step: 1265, loss: 0.22469, accuracy: 0.85 [Train] epoch: 0, step: 1266, loss: 0.33177, accuracy: 0.85 [Train] epoch: 0, step: 1267, loss: 0.32243, accuracy: 0.90 [Train] epoch: 0, step: 1268, loss: 0.19139, accuracy: 0.95 [Train] epoch: 0, step: 1269, loss: 0.12758, accuracy: 0.95 [Train] epoch: 0, step: 1270, loss: 0.23029, accuracy: 0.95 [Train] epoch: 0, step: 1271, loss: 0.43357, accuracy: 0.90 [Train] epoch: 0, step: 1272, loss: 0.46032, accuracy: 0.80 [Train] epoch: 0, step: 1273, loss: 0.23055, accuracy: 0.95 [Train] epoch: 0, step: 1274, loss: 0.36110, accuracy: 0.90 [Train] epoch: 0, step: 1275, loss: 0.59001, accuracy: 0.70 [Train] epoch: 0, step: 1276, loss: 0.14449, accuracy: 0.95 [Train] epoch: 0, step:

[Train] epoch: 0, step: 1582, loss: 0.84140, accuracy: 0.65 [Train] epoch: 0, step: 1583, loss: 0.21365, accuracy: 0.95 [Train] epoch: 0, step: 1584, loss: 0.43668, accuracy: 0.85 [Train] epoch: 0, step: 1585, loss: 0.62705, accuracy: 0.70 [Train] epoch: 0, step: 1586, loss: 0.31652, accuracy: 0.85 [Train] epoch: 0, step: 1587, loss: 0.35705, accuracy: 0.85 [Train] epoch: 0, step: 1588, loss: 0.46268, accuracy: 0.75 [Train] epoch: 0, step: 1589, loss: 0.78616, accuracy: 0.75 [Train] epoch: 0, step: 1590, loss: 0.23638, accuracy: 0.90 [Train] epoch: 0, step: 1591, loss: 0.49781, accuracy: 0.80 [Train] epoch: 0, step: 1592, loss: 0.20091, accuracy: 1.00 [Train] epoch: 0, step: 1593, loss: 0.34169, accuracy: 0.80 [Train] epoch: 0, step: 1594, loss: 0.49887, accuracy: 0.70 [Train] epoch: 0, step: 1595, loss: 0.40815, accuracy: 0.70 [Train] epoch: 0, step: 1596, loss: 0.43479, accuracy: 0.85 [Train] epoch: 0, step: 1597, loss: 0.16663, accuracy: 0.95 [Train] epoch: 0, step:

[Train] epoch: 0, step: 1898, loss: 0.28873, accuracy: 0.90 [Train] epoch: 0, step: 1899, loss: 0.72852, accuracy: 0.70 [Train] epoch: 0, step: 1900, loss: 0.35182, accuracy: 0.90 [Train] epoch: 0, step: 1901, loss: 0.29029, accuracy: 0.90 [Train] epoch: 0, step: 1902, loss: 0.24361, accuracy: 0.95 [Train] epoch: 0, step: 1903, loss: 0.20453, accuracy: 0.90 [Train] epoch: 0, step: 1904, loss: 0.55643, accuracy: 0.70 [Train] epoch: 0, step: 1905, loss: 0.31719, accuracy: 0.90 [Train] epoch: 0, step: 1906, loss: 0.16874, accuracy: 0.95 [Train] epoch: 0, step: 1907, loss: 0.15923, accuracy: 0.95 [Train] epoch: 0, step: 1908, loss: 0.48222, accuracy: 0.85 [Train] epoch: 0, step: 1909, loss: 0.46482, accuracy: 0.90 [Train] epoch: 0, step: 1910, loss: 0.73426, accuracy: 0.85 [Train] epoch: 0, step: 1911, loss: 0.27568, accuracy: 0.85 [Train] epoch: 0, step: 1912, loss: 0.40152, accuracy: 0.95 [Train] epoch: 0, step: 1913, loss: 0.45718, accuracy: 0.95 [Train] epoch: 0, step:

[Train] epoch: 0, step: 2212, loss: 0.46638, accuracy: 0.80 [Train] epoch: 0, step: 2213, loss: 0.27074, accuracy: 0.95 [Train] epoch: 0, step: 2214, loss: 0.47477, accuracy: 0.85 [Train] epoch: 0, step: 2215, loss: 0.37195, accuracy: 0.85 [Train] epoch: 0, step: 2216, loss: 0.81927, accuracy: 0.80 [Train] epoch: 0, step: 2217, loss: 0.37992, accuracy: 0.90 [Train] epoch: 0, step: 2218, loss: 0.52065, accuracy: 0.75 [Train] epoch: 0, step: 2219, loss: 0.40718, accuracy: 0.80 [Train] epoch: 0, step: 2220, loss: 0.49181, accuracy: 0.75 [Train] epoch: 0, step: 2221, loss: 0.64917, accuracy: 0.80 [Train] epoch: 0, step: 2222, loss: 0.21032, accuracy: 0.90 [Train] epoch: 0, step: 2223, loss: 0.24126, accuracy: 0.90 [Train] epoch: 0, step: 2224, loss: 0.47047, accuracy: 0.75 [Train] epoch: 0, step: 2225, loss: 0.35912, accuracy: 0.90 [Train] epoch: 0, step: 2226, loss: 0.10880, accuracy: 1.00 [Train] epoch: 0, step: 2227, loss: 0.61199, accuracy: 0.80 [Train] epoch: 0, step:

[Train] epoch: 0, step: 2530, loss: 0.11759, accuracy: 0.95 [Train] epoch: 0, step: 2531, loss: 0.49815, accuracy: 0.90 [Train] epoch: 0, step: 2532, loss: 0.75292, accuracy: 0.65 [Train] epoch: 0, step: 2533, loss: 0.32633, accuracy: 0.85 [Train] epoch: 0, step: 2534, loss: 0.32177, accuracy: 0.80 [Train] epoch: 0, step: 2535, loss: 0.53893, accuracy: 0.85 [Train] epoch: 0, step: 2536, loss: 0.24206, accuracy: 0.90 [Train] epoch: 0, step: 2537, loss: 0.42912, accuracy: 0.85 [Train] epoch: 0, step: 2538, loss: 0.31709, accuracy: 0.85 [Train] epoch: 0, step: 2539, loss: 0.19201, accuracy: 0.95 [Train] epoch: 0, step: 2540, loss: 0.28530, accuracy: 0.95 [Train] epoch: 0, step: 2541, loss: 0.33966, accuracy: 0.85 [Train] epoch: 0, step: 2542, loss: 0.41269, accuracy: 0.80 [Train] epoch: 0, step: 2543, loss: 0.44550, accuracy: 0.75 [Train] epoch: 0, step: 2544, loss: 0.27905, accuracy: 0.90 [Train] epoch: 0, step: 2545, loss: 0.43346, accuracy: 0.80 [Train] epoch: 0, step:

[Train] epoch: 1, step: 98, loss: 0.52546, accuracy: 0.75 [Train] epoch: 1, step: 99, loss: 0.48827, accuracy: 0.80 [Train] epoch: 1, step: 100, loss: 0.42588, accuracy: 0.75 [Train] epoch: 1, step: 101, loss: 0.42072, accuracy: 0.85 [Train] epoch: 1, step: 102, loss: 0.21705, accuracy: 0.90 [Train] epoch: 1, step: 103, loss: 0.20871, accuracy: 0.85 [Train] epoch: 1, step: 104, loss: 0.39624, accuracy: 0.85 [Train] epoch: 1, step: 105, loss: 0.44085, accuracy: 0.85 [Train] epoch: 1, step: 106, loss: 0.14649, accuracy: 0.95 [Train] epoch: 1, step: 107, loss: 0.44101, accuracy: 0.80 [Train] epoch: 1, step: 108, loss: 0.34546, accuracy: 0.95 [Train] epoch: 1, step: 109, loss: 0.51365, accuracy: 0.80 [Train] epoch: 1, step: 110, loss: 0.51381, accuracy: 0.90 [Train] epoch: 1, step: 111, loss: 0.39560, accuracy: 0.85 [Train] epoch: 1, step: 112, loss: 0.32732, accuracy: 0.90 [Train] epoch: 1, step: 113, loss: 0.35617, accuracy: 0.85 [Train] epoch: 1, step: 114, loss: 0.4112

[Train] epoch: 1, step: 418, loss: 0.59536, accuracy: 0.70 [Train] epoch: 1, step: 419, loss: 0.64156, accuracy: 0.80 [Train] epoch: 1, step: 420, loss: 0.29095, accuracy: 0.85 [Train] epoch: 1, step: 421, loss: 0.26958, accuracy: 0.90 [Train] epoch: 1, step: 422, loss: 0.31019, accuracy: 0.85 [Train] epoch: 1, step: 423, loss: 0.33820, accuracy: 0.80 [Train] epoch: 1, step: 424, loss: 0.31640, accuracy: 0.85 [Train] epoch: 1, step: 425, loss: 0.25321, accuracy: 0.90 [Train] epoch: 1, step: 426, loss: 0.44687, accuracy: 0.80 [Train] epoch: 1, step: 427, loss: 0.56029, accuracy: 0.80 [Train] epoch: 1, step: 428, loss: 0.59465, accuracy: 0.80 [Train] epoch: 1, step: 429, loss: 0.48122, accuracy: 0.85 [Train] epoch: 1, step: 430, loss: 0.58848, accuracy: 0.80 [Train] epoch: 1, step: 431, loss: 0.46990, accuracy: 0.80 [Train] epoch: 1, step: 432, loss: 0.54794, accuracy: 0.75 [Train] epoch: 1, step: 433, loss: 0.31349, accuracy: 0.85 [Train] epoch: 1, step: 434, loss: 0.59

[Train] epoch: 1, step: 736, loss: 0.12773, accuracy: 0.95 [Train] epoch: 1, step: 737, loss: 0.18800, accuracy: 0.95 [Train] epoch: 1, step: 738, loss: 0.32229, accuracy: 0.85 [Train] epoch: 1, step: 739, loss: 0.38337, accuracy: 0.75 [Train] epoch: 1, step: 740, loss: 0.79039, accuracy: 0.80 [Train] epoch: 1, step: 741, loss: 0.43239, accuracy: 0.85 [Train] epoch: 1, step: 742, loss: 0.73183, accuracy: 0.70 [Train] epoch: 1, step: 743, loss: 0.24816, accuracy: 0.90 [Train] epoch: 1, step: 744, loss: 0.27172, accuracy: 0.85 [Train] epoch: 1, step: 745, loss: 0.37167, accuracy: 0.80 [Train] epoch: 1, step: 746, loss: 0.46653, accuracy: 0.75 [Train] epoch: 1, step: 747, loss: 0.36618, accuracy: 0.80 [Train] epoch: 1, step: 748, loss: 0.32043, accuracy: 0.85 [Train] epoch: 1, step: 749, loss: 0.59666, accuracy: 0.80 [Train] epoch: 1, step: 750, loss: 0.15763, accuracy: 1.00 [Train] epoch: 1, step: 751, loss: 0.41276, accuracy: 0.80 [Train] epoch: 1, step: 752, loss: 0.22

[Train] epoch: 1, step: 1043, loss: 0.21684, accuracy: 0.90 [Train] epoch: 1, step: 1044, loss: 0.56358, accuracy: 0.80 [Train] epoch: 1, step: 1045, loss: 0.13357, accuracy: 1.00 [Train] epoch: 1, step: 1046, loss: 0.20299, accuracy: 0.95 [Train] epoch: 1, step: 1047, loss: 0.18904, accuracy: 1.00 [Train] epoch: 1, step: 1048, loss: 0.41162, accuracy: 0.80 [Train] epoch: 1, step: 1049, loss: 0.23599, accuracy: 0.85 [Train] epoch: 1, step: 1050, loss: 0.48756, accuracy: 0.85 [Train] epoch: 1, step: 1051, loss: 0.44208, accuracy: 0.75 [Train] epoch: 1, step: 1052, loss: 0.72670, accuracy: 0.80 [Train] epoch: 1, step: 1053, loss: 0.40829, accuracy: 0.85 [Train] epoch: 1, step: 1054, loss: 0.33194, accuracy: 0.85 [Train] epoch: 1, step: 1055, loss: 0.46017, accuracy: 0.80 [Train] epoch: 1, step: 1056, loss: 0.29736, accuracy: 0.90 [Train] epoch: 1, step: 1057, loss: 0.36223, accuracy: 0.90 [Train] epoch: 1, step: 1058, loss: 0.14620, accuracy: 0.95 [Train] epoch: 1, step:

[Train] epoch: 1, step: 1358, loss: 0.44469, accuracy: 0.80 [Train] epoch: 1, step: 1359, loss: 0.14112, accuracy: 0.90 [Train] epoch: 1, step: 1360, loss: 0.36198, accuracy: 0.80 [Train] epoch: 1, step: 1361, loss: 0.34229, accuracy: 0.90 [Train] epoch: 1, step: 1362, loss: 0.61904, accuracy: 0.85 [Train] epoch: 1, step: 1363, loss: 0.31855, accuracy: 0.85 [Train] epoch: 1, step: 1364, loss: 0.09052, accuracy: 1.00 [Train] epoch: 1, step: 1365, loss: 0.56403, accuracy: 0.80 [Train] epoch: 1, step: 1366, loss: 0.28981, accuracy: 0.90 [Train] epoch: 1, step: 1367, loss: 0.18708, accuracy: 0.95 [Train] epoch: 1, step: 1368, loss: 0.30833, accuracy: 0.90 [Train] epoch: 1, step: 1369, loss: 0.27542, accuracy: 0.90 [Train] epoch: 1, step: 1370, loss: 0.71943, accuracy: 0.80 [Train] epoch: 1, step: 1371, loss: 0.32690, accuracy: 0.80 [Train] epoch: 1, step: 1372, loss: 0.28272, accuracy: 0.90 [Train] epoch: 1, step: 1373, loss: 0.18319, accuracy: 0.95 [Train] epoch: 1, step:

[Train] epoch: 1, step: 1670, loss: 0.20194, accuracy: 0.95 [Train] epoch: 1, step: 1671, loss: 0.44835, accuracy: 0.80 [Train] epoch: 1, step: 1672, loss: 0.28422, accuracy: 0.85 [Train] epoch: 1, step: 1673, loss: 0.17649, accuracy: 0.95 [Train] epoch: 1, step: 1674, loss: 0.44158, accuracy: 0.90 [Train] epoch: 1, step: 1675, loss: 0.16128, accuracy: 0.95 [Train] epoch: 1, step: 1676, loss: 0.41340, accuracy: 0.85 [Train] epoch: 1, step: 1677, loss: 0.52529, accuracy: 0.80 [Train] epoch: 1, step: 1678, loss: 0.30063, accuracy: 0.85 [Train] epoch: 1, step: 1679, loss: 0.25832, accuracy: 0.90 [Train] epoch: 1, step: 1680, loss: 0.56433, accuracy: 0.75 [Train] epoch: 1, step: 1681, loss: 0.30518, accuracy: 0.85 [Train] epoch: 1, step: 1682, loss: 0.35034, accuracy: 0.85 [Train] epoch: 1, step: 1683, loss: 0.47971, accuracy: 0.85 [Train] epoch: 1, step: 1684, loss: 0.48540, accuracy: 0.80 [Train] epoch: 1, step: 1685, loss: 0.32012, accuracy: 0.90 [Train] epoch: 1, step:

[Train] epoch: 1, step: 1980, loss: 0.34840, accuracy: 0.90 [Train] epoch: 1, step: 1981, loss: 0.32217, accuracy: 0.80 [Train] epoch: 1, step: 1982, loss: 0.26047, accuracy: 0.95 [Train] epoch: 1, step: 1983, loss: 0.34285, accuracy: 0.95 [Train] epoch: 1, step: 1984, loss: 0.17922, accuracy: 0.95 [Train] epoch: 1, step: 1985, loss: 0.14274, accuracy: 0.95 [Train] epoch: 1, step: 1986, loss: 0.18369, accuracy: 0.95 [Train] epoch: 1, step: 1987, loss: 0.57831, accuracy: 0.80 [Train] epoch: 1, step: 1988, loss: 0.78508, accuracy: 0.80 [Train] epoch: 1, step: 1989, loss: 0.55522, accuracy: 0.80 [Train] epoch: 1, step: 1990, loss: 0.26462, accuracy: 0.90 [Train] epoch: 1, step: 1991, loss: 0.87792, accuracy: 0.70 [Train] epoch: 1, step: 1992, loss: 0.16826, accuracy: 0.90 [Train] epoch: 1, step: 1993, loss: 0.20366, accuracy: 0.95 [Train] epoch: 1, step: 1994, loss: 0.27135, accuracy: 0.90 [Train] epoch: 1, step: 1995, loss: 0.57887, accuracy: 0.85 [Train] epoch: 1, step:

[Train] epoch: 1, step: 2294, loss: 0.25120, accuracy: 0.85 [Train] epoch: 1, step: 2295, loss: 0.55478, accuracy: 0.70 [Train] epoch: 1, step: 2296, loss: 0.10355, accuracy: 1.00 [Train] epoch: 1, step: 2297, loss: 0.25620, accuracy: 0.90 [Train] epoch: 1, step: 2298, loss: 0.23653, accuracy: 0.95 [Train] epoch: 1, step: 2299, loss: 0.26638, accuracy: 0.90 [Train] epoch: 1, step: 2300, loss: 0.71095, accuracy: 0.65 [Train] epoch: 1, step: 2301, loss: 0.27954, accuracy: 0.80 [Train] epoch: 1, step: 2302, loss: 0.18646, accuracy: 0.95 [Train] epoch: 1, step: 2303, loss: 0.32652, accuracy: 0.85 [Train] epoch: 1, step: 2304, loss: 0.11627, accuracy: 0.95 [Train] epoch: 1, step: 2305, loss: 0.39076, accuracy: 0.80 [Train] epoch: 1, step: 2306, loss: 0.49653, accuracy: 0.85 [Train] epoch: 1, step: 2307, loss: 0.42404, accuracy: 0.80 [Train] epoch: 1, step: 2308, loss: 0.53763, accuracy: 0.75 [Train] epoch: 1, step: 2309, loss: 0.32772, accuracy: 0.80 [Train] epoch: 1, step:

[Train] epoch: 1, step: 2595, loss: 0.41428, accuracy: 0.75 [Train] epoch: 1, step: 2596, loss: 0.24329, accuracy: 0.95 [Train] epoch: 1, step: 2597, loss: 0.28576, accuracy: 0.95 [Train] epoch: 1, step: 2598, loss: 0.56193, accuracy: 0.70 [Train] epoch: 1, step: 2599, loss: 0.36787, accuracy: 0.85 [Train] epoch: 1, step: 2600, loss: 0.27370, accuracy: 0.80 [Train] epoch: 1, step: 2601, loss: 0.50459, accuracy: 0.80 [Train] epoch: 1, step: 2602, loss: 0.34646, accuracy: 0.75 [Train] epoch: 1, step: 2603, loss: 0.61036, accuracy: 0.75 [Train] epoch: 1, step: 2604, loss: 0.40847, accuracy: 0.80 [Train] epoch: 1, step: 2605, loss: 0.46231, accuracy: 0.75 [Train] epoch: 1, step: 2606, loss: 0.36933, accuracy: 0.85 [Train] epoch: 1, step: 2607, loss: 0.64239, accuracy: 0.85 [Train] epoch: 1, step: 2608, loss: 0.72825, accuracy: 0.75 [Train] epoch: 1, step: 2609, loss: 0.23792, accuracy: 0.95 [Train] epoch: 1, step: 2610, loss: 0.72758, accuracy: 0.70 [Train] epoch: 1, step:

[Train] epoch: 2, step: 151, loss: 0.29870, accuracy: 0.90 [Train] epoch: 2, step: 152, loss: 0.52429, accuracy: 0.75 [Train] epoch: 2, step: 153, loss: 0.26051, accuracy: 0.85 [Train] epoch: 2, step: 154, loss: 0.22698, accuracy: 0.90 [Train] epoch: 2, step: 155, loss: 0.33970, accuracy: 0.90 [Train] epoch: 2, step: 156, loss: 0.44554, accuracy: 0.80 [Train] epoch: 2, step: 157, loss: 0.33175, accuracy: 0.85 [Train] epoch: 2, step: 158, loss: 0.09543, accuracy: 1.00 [Train] epoch: 2, step: 159, loss: 0.27981, accuracy: 0.85 [Train] epoch: 2, step: 160, loss: 0.29619, accuracy: 0.85 [Train] epoch: 2, step: 161, loss: 0.25001, accuracy: 0.90 [Train] epoch: 2, step: 162, loss: 0.32319, accuracy: 0.90 [Train] epoch: 2, step: 163, loss: 0.42000, accuracy: 0.90 [Train] epoch: 2, step: 164, loss: 0.35126, accuracy: 0.90 [Train] epoch: 2, step: 165, loss: 0.57736, accuracy: 0.75 [Train] epoch: 2, step: 166, loss: 0.54467, accuracy: 0.80 [Train] epoch: 2, step: 167, loss: 0.25

[Train] epoch: 2, step: 456, loss: 0.20769, accuracy: 0.95 [Train] epoch: 2, step: 457, loss: 0.53085, accuracy: 0.80 [Train] epoch: 2, step: 458, loss: 0.47146, accuracy: 0.80 [Train] epoch: 2, step: 459, loss: 0.33198, accuracy: 0.90 [Train] epoch: 2, step: 460, loss: 0.38741, accuracy: 0.80 [Train] epoch: 2, step: 461, loss: 0.11381, accuracy: 1.00 [Train] epoch: 2, step: 462, loss: 0.23672, accuracy: 0.85 [Train] epoch: 2, step: 463, loss: 0.84500, accuracy: 0.75 [Train] epoch: 2, step: 464, loss: 0.22883, accuracy: 0.90 [Train] epoch: 2, step: 465, loss: 0.49414, accuracy: 0.85 [Train] epoch: 2, step: 466, loss: 0.35695, accuracy: 0.80 [Train] epoch: 2, step: 467, loss: 0.39956, accuracy: 0.90 [Train] epoch: 2, step: 468, loss: 0.18589, accuracy: 0.95 [Train] epoch: 2, step: 469, loss: 0.16309, accuracy: 0.95 [Train] epoch: 2, step: 470, loss: 0.15992, accuracy: 0.95 [Train] epoch: 2, step: 471, loss: 0.40128, accuracy: 0.85 [Train] epoch: 2, step: 472, loss: 0.52

[Train] epoch: 2, step: 761, loss: 0.28037, accuracy: 0.80 [Train] epoch: 2, step: 762, loss: 0.44799, accuracy: 0.75 [Train] epoch: 2, step: 763, loss: 0.12875, accuracy: 0.95 [Train] epoch: 2, step: 764, loss: 0.32766, accuracy: 0.85 [Train] epoch: 2, step: 765, loss: 0.39051, accuracy: 0.90 [Train] epoch: 2, step: 766, loss: 0.35346, accuracy: 0.90 [Train] epoch: 2, step: 767, loss: 0.38996, accuracy: 0.85 [Train] epoch: 2, step: 768, loss: 0.09723, accuracy: 1.00 [Train] epoch: 2, step: 769, loss: 0.10457, accuracy: 1.00 [Train] epoch: 2, step: 770, loss: 0.37357, accuracy: 0.85 [Train] epoch: 2, step: 771, loss: 0.46143, accuracy: 0.60 [Train] epoch: 2, step: 772, loss: 0.28928, accuracy: 0.95 [Train] epoch: 2, step: 773, loss: 0.20190, accuracy: 0.90 [Train] epoch: 2, step: 774, loss: 0.69904, accuracy: 0.85 [Train] epoch: 2, step: 775, loss: 0.08809, accuracy: 0.95 [Train] epoch: 2, step: 776, loss: 0.30328, accuracy: 0.90 [Train] epoch: 2, step: 777, loss: 0.81

[Train] epoch: 2, step: 1063, loss: 0.44875, accuracy: 0.85 [Train] epoch: 2, step: 1064, loss: 0.25650, accuracy: 0.85 [Train] epoch: 2, step: 1065, loss: 0.36322, accuracy: 0.85 [Train] epoch: 2, step: 1066, loss: 0.31272, accuracy: 0.80 [Train] epoch: 2, step: 1067, loss: 0.25482, accuracy: 0.90 [Train] epoch: 2, step: 1068, loss: 0.14159, accuracy: 0.95 [Train] epoch: 2, step: 1069, loss: 0.32040, accuracy: 0.85 [Train] epoch: 2, step: 1070, loss: 0.15095, accuracy: 0.95 [Train] epoch: 2, step: 1071, loss: 0.47371, accuracy: 0.75 [Train] epoch: 2, step: 1072, loss: 0.36681, accuracy: 0.85 [Train] epoch: 2, step: 1073, loss: 0.21932, accuracy: 0.90 [Train] epoch: 2, step: 1074, loss: 0.11821, accuracy: 1.00 [Train] epoch: 2, step: 1075, loss: 0.27211, accuracy: 0.80 [Train] epoch: 2, step: 1076, loss: 0.28970, accuracy: 0.85 [Train] epoch: 2, step: 1077, loss: 0.25415, accuracy: 0.90 [Train] epoch: 2, step: 1078, loss: 0.08688, accuracy: 1.00 [Train] epoch: 2, step:

[Train] epoch: 2, step: 1366, loss: 0.21805, accuracy: 0.90 [Train] epoch: 2, step: 1367, loss: 0.12781, accuracy: 0.95 [Train] epoch: 2, step: 1368, loss: 0.33584, accuracy: 0.90 [Train] epoch: 2, step: 1369, loss: 0.31008, accuracy: 0.90 [Train] epoch: 2, step: 1370, loss: 0.54744, accuracy: 0.80 [Train] epoch: 2, step: 1371, loss: 0.27003, accuracy: 0.80 [Train] epoch: 2, step: 1372, loss: 0.22729, accuracy: 0.90 [Train] epoch: 2, step: 1373, loss: 0.16173, accuracy: 0.95 [Train] epoch: 2, step: 1374, loss: 0.29086, accuracy: 0.95 [Train] epoch: 2, step: 1375, loss: 0.42179, accuracy: 0.85 [Train] epoch: 2, step: 1376, loss: 0.02280, accuracy: 1.00 [Train] epoch: 2, step: 1377, loss: 0.12988, accuracy: 0.95 [Train] epoch: 2, step: 1378, loss: 0.22520, accuracy: 0.90 [Train] epoch: 2, step: 1379, loss: 0.10032, accuracy: 1.00 [Train] epoch: 2, step: 1380, loss: 0.32453, accuracy: 0.90 [Train] epoch: 2, step: 1381, loss: 0.05917, accuracy: 1.00 [Train] epoch: 2, step:

[Train] epoch: 2, step: 1663, loss: 0.39705, accuracy: 0.80 [Train] epoch: 2, step: 1664, loss: 0.06472, accuracy: 1.00 [Train] epoch: 2, step: 1665, loss: 0.26197, accuracy: 0.90 [Train] epoch: 2, step: 1666, loss: 0.28253, accuracy: 0.85 [Train] epoch: 2, step: 1667, loss: 0.29485, accuracy: 0.85 [Train] epoch: 2, step: 1668, loss: 0.20451, accuracy: 0.95 [Train] epoch: 2, step: 1669, loss: 0.15720, accuracy: 1.00 [Train] epoch: 2, step: 1670, loss: 0.09309, accuracy: 1.00 [Train] epoch: 2, step: 1671, loss: 0.46488, accuracy: 0.80 [Train] epoch: 2, step: 1672, loss: 0.16362, accuracy: 0.90 [Train] epoch: 2, step: 1673, loss: 0.17505, accuracy: 0.95 [Train] epoch: 2, step: 1674, loss: 0.55856, accuracy: 0.90 [Train] epoch: 2, step: 1675, loss: 0.13467, accuracy: 0.95 [Train] epoch: 2, step: 1676, loss: 0.32029, accuracy: 0.85 [Train] epoch: 2, step: 1677, loss: 0.45476, accuracy: 0.80 [Train] epoch: 2, step: 1678, loss: 0.29987, accuracy: 0.85 [Train] epoch: 2, step:

[Train] epoch: 2, step: 1965, loss: 0.05067, accuracy: 1.00 [Train] epoch: 2, step: 1966, loss: 0.60465, accuracy: 0.80 [Train] epoch: 2, step: 1967, loss: 0.87127, accuracy: 0.80 [Train] epoch: 2, step: 1968, loss: 0.15143, accuracy: 0.90 [Train] epoch: 2, step: 1969, loss: 0.45892, accuracy: 0.90 [Train] epoch: 2, step: 1970, loss: 0.46594, accuracy: 0.75 [Train] epoch: 2, step: 1971, loss: 0.26687, accuracy: 0.95 [Train] epoch: 2, step: 1972, loss: 0.29040, accuracy: 0.90 [Train] epoch: 2, step: 1973, loss: 0.13454, accuracy: 0.95 [Train] epoch: 2, step: 1974, loss: 0.30805, accuracy: 0.95 [Train] epoch: 2, step: 1975, loss: 0.42474, accuracy: 0.80 [Train] epoch: 2, step: 1976, loss: 0.13656, accuracy: 0.95 [Train] epoch: 2, step: 1977, loss: 0.41421, accuracy: 0.95 [Train] epoch: 2, step: 1978, loss: 0.37996, accuracy: 0.90 [Train] epoch: 2, step: 1979, loss: 0.14508, accuracy: 0.95 [Train] epoch: 2, step: 1980, loss: 0.23965, accuracy: 0.95 [Train] epoch: 2, step:

[Train] epoch: 2, step: 2263, loss: 0.37427, accuracy: 0.80 [Train] epoch: 2, step: 2264, loss: 0.31508, accuracy: 0.90 [Train] epoch: 2, step: 2265, loss: 0.33139, accuracy: 0.85 [Train] epoch: 2, step: 2266, loss: 0.22048, accuracy: 0.95 [Train] epoch: 2, step: 2267, loss: 0.31867, accuracy: 0.80 [Train] epoch: 2, step: 2268, loss: 0.38609, accuracy: 0.85 [Train] epoch: 2, step: 2269, loss: 0.40106, accuracy: 0.90 [Train] epoch: 2, step: 2270, loss: 0.19869, accuracy: 0.90 [Train] epoch: 2, step: 2271, loss: 0.35438, accuracy: 0.85 [Train] epoch: 2, step: 2272, loss: 0.10028, accuracy: 0.95 [Train] epoch: 2, step: 2273, loss: 0.35191, accuracy: 0.85 [Train] epoch: 2, step: 2274, loss: 0.25444, accuracy: 0.90 [Train] epoch: 2, step: 2275, loss: 0.19254, accuracy: 1.00 [Train] epoch: 2, step: 2276, loss: 0.31029, accuracy: 0.85 [Train] epoch: 2, step: 2277, loss: 0.23550, accuracy: 0.95 [Train] epoch: 2, step: 2278, loss: 0.12530, accuracy: 1.00 [Train] epoch: 2, step:

[Train] epoch: 2, step: 2568, loss: 0.31796, accuracy: 0.85 [Train] epoch: 2, step: 2569, loss: 0.20601, accuracy: 0.90 [Train] epoch: 2, step: 2570, loss: 0.09844, accuracy: 1.00 [Train] epoch: 2, step: 2571, loss: 0.28712, accuracy: 0.90 [Train] epoch: 2, step: 2572, loss: 0.55127, accuracy: 0.80 [Train] epoch: 2, step: 2573, loss: 0.27471, accuracy: 0.85 [Train] epoch: 2, step: 2574, loss: 0.36134, accuracy: 0.80 [Train] epoch: 2, step: 2575, loss: 0.48869, accuracy: 0.90 [Train] epoch: 2, step: 2576, loss: 0.29081, accuracy: 0.95 [Train] epoch: 2, step: 2577, loss: 0.43573, accuracy: 0.80 [Train] epoch: 2, step: 2578, loss: 0.25609, accuracy: 0.85 [Train] epoch: 2, step: 2579, loss: 0.41896, accuracy: 0.85 [Train] epoch: 2, step: 2580, loss: 0.33160, accuracy: 0.85 [Train] epoch: 2, step: 2581, loss: 0.35603, accuracy: 0.95 [Train] epoch: 2, step: 2582, loss: 0.07140, accuracy: 1.00 [Train] epoch: 2, step: 2583, loss: 0.27692, accuracy: 0.90 [Train] epoch: 2, step:

[Train] epoch: 3, step: 124, loss: 0.21347, accuracy: 0.90 [Train] epoch: 3, step: 125, loss: 0.27448, accuracy: 0.95 [Train] epoch: 3, step: 126, loss: 0.43575, accuracy: 0.90 [Train] epoch: 3, step: 127, loss: 0.13679, accuracy: 0.95 [Train] epoch: 3, step: 128, loss: 0.16628, accuracy: 0.90 [Train] epoch: 3, step: 129, loss: 0.32505, accuracy: 0.80 [Train] epoch: 3, step: 130, loss: 0.53577, accuracy: 0.75 [Train] epoch: 3, step: 131, loss: 0.52077, accuracy: 0.85 [Train] epoch: 3, step: 132, loss: 0.25681, accuracy: 0.85 [Train] epoch: 3, step: 133, loss: 0.79531, accuracy: 0.65 [Train] epoch: 3, step: 134, loss: 0.21602, accuracy: 0.90 [Train] epoch: 3, step: 135, loss: 0.33310, accuracy: 0.90 [Train] epoch: 3, step: 136, loss: 0.13302, accuracy: 1.00 [Train] epoch: 3, step: 137, loss: 0.45968, accuracy: 0.80 [Train] epoch: 3, step: 138, loss: 0.43876, accuracy: 0.75 [Train] epoch: 3, step: 139, loss: 0.16535, accuracy: 0.95 [Train] epoch: 3, step: 140, loss: 0.11

[Train] epoch: 3, step: 428, loss: 0.43037, accuracy: 0.75 [Train] epoch: 3, step: 429, loss: 0.68234, accuracy: 0.80 [Train] epoch: 3, step: 430, loss: 0.48991, accuracy: 0.80 [Train] epoch: 3, step: 431, loss: 0.43139, accuracy: 0.85 [Train] epoch: 3, step: 432, loss: 0.44555, accuracy: 0.80 [Train] epoch: 3, step: 433, loss: 0.31322, accuracy: 0.80 [Train] epoch: 3, step: 434, loss: 0.43446, accuracy: 0.80 [Train] epoch: 3, step: 435, loss: 0.31205, accuracy: 0.95 [Train] epoch: 3, step: 436, loss: 0.22849, accuracy: 0.85 [Train] epoch: 3, step: 437, loss: 0.14733, accuracy: 1.00 [Train] epoch: 3, step: 438, loss: 0.36969, accuracy: 0.90 [Train] epoch: 3, step: 439, loss: 0.28803, accuracy: 0.90 [Train] epoch: 3, step: 440, loss: 0.22548, accuracy: 0.95 [Train] epoch: 3, step: 441, loss: 0.26570, accuracy: 0.90 [Train] epoch: 3, step: 442, loss: 0.26616, accuracy: 0.90 [Train] epoch: 3, step: 443, loss: 0.45228, accuracy: 0.85 [Train] epoch: 3, step: 444, loss: 0.34

[Train] epoch: 3, step: 730, loss: 0.17102, accuracy: 0.90 [Train] epoch: 3, step: 731, loss: 0.11348, accuracy: 1.00 [Train] epoch: 3, step: 732, loss: 0.14685, accuracy: 0.95 [Train] epoch: 3, step: 733, loss: 0.09629, accuracy: 1.00 [Train] epoch: 3, step: 734, loss: 0.14350, accuracy: 0.95 [Train] epoch: 3, step: 735, loss: 0.55929, accuracy: 0.75 [Train] epoch: 3, step: 736, loss: 0.10886, accuracy: 1.00 [Train] epoch: 3, step: 737, loss: 0.22910, accuracy: 0.95 [Train] epoch: 3, step: 738, loss: 0.08503, accuracy: 1.00 [Train] epoch: 3, step: 739, loss: 0.22067, accuracy: 0.90 [Train] epoch: 3, step: 740, loss: 0.75904, accuracy: 0.80 [Train] epoch: 3, step: 741, loss: 0.28954, accuracy: 0.90 [Train] epoch: 3, step: 742, loss: 0.77269, accuracy: 0.80 [Train] epoch: 3, step: 743, loss: 0.20107, accuracy: 0.95 [Train] epoch: 3, step: 744, loss: 0.24311, accuracy: 0.95 [Train] epoch: 3, step: 745, loss: 0.22956, accuracy: 0.90 [Train] epoch: 3, step: 746, loss: 0.54

[Train] epoch: 3, step: 1025, loss: 0.59754, accuracy: 0.80 [Train] epoch: 3, step: 1026, loss: 0.15658, accuracy: 0.95 [Train] epoch: 3, step: 1027, loss: 0.48225, accuracy: 0.75 [Train] epoch: 3, step: 1028, loss: 0.47328, accuracy: 0.90 [Train] epoch: 3, step: 1029, loss: 0.47670, accuracy: 0.90 [Train] epoch: 3, step: 1030, loss: 0.45858, accuracy: 0.85 [Train] epoch: 3, step: 1031, loss: 0.28777, accuracy: 0.80 [Train] epoch: 3, step: 1032, loss: 0.20666, accuracy: 0.95 [Train] epoch: 3, step: 1033, loss: 0.43962, accuracy: 0.80 [Train] epoch: 3, step: 1034, loss: 0.15315, accuracy: 0.95 [Train] epoch: 3, step: 1035, loss: 0.27639, accuracy: 0.85 [Train] epoch: 3, step: 1036, loss: 0.07483, accuracy: 1.00 [Train] epoch: 3, step: 1037, loss: 0.23820, accuracy: 0.85 [Train] epoch: 3, step: 1038, loss: 0.40419, accuracy: 0.85 [Train] epoch: 3, step: 1039, loss: 0.51194, accuracy: 0.70 [Train] epoch: 3, step: 1040, loss: 0.32684, accuracy: 0.85 [Train] epoch: 3, step:

[Train] epoch: 3, step: 1330, loss: 0.23966, accuracy: 0.95 [Train] epoch: 3, step: 1331, loss: 0.22516, accuracy: 0.90 [Train] epoch: 3, step: 1332, loss: 0.42522, accuracy: 0.80 [Train] epoch: 3, step: 1333, loss: 0.44242, accuracy: 0.85 [Train] epoch: 3, step: 1334, loss: 0.34623, accuracy: 0.90 [Train] epoch: 3, step: 1335, loss: 0.45285, accuracy: 0.85 [Train] epoch: 3, step: 1336, loss: 0.18993, accuracy: 0.90 [Train] epoch: 3, step: 1337, loss: 0.24693, accuracy: 0.90 [Train] epoch: 3, step: 1338, loss: 0.49518, accuracy: 0.75 [Train] epoch: 3, step: 1339, loss: 0.12232, accuracy: 1.00 [Train] epoch: 3, step: 1340, loss: 0.11864, accuracy: 0.90 [Train] epoch: 3, step: 1341, loss: 0.15853, accuracy: 0.90 [Train] epoch: 3, step: 1342, loss: 0.16688, accuracy: 0.95 [Train] epoch: 3, step: 1343, loss: 0.30969, accuracy: 0.85 [Train] epoch: 3, step: 1344, loss: 0.17095, accuracy: 0.95 [Train] epoch: 3, step: 1345, loss: 0.13905, accuracy: 0.95 [Train] epoch: 3, step:

[Train] epoch: 3, step: 1637, loss: 0.37289, accuracy: 0.85 [Train] epoch: 3, step: 1638, loss: 0.14711, accuracy: 0.95 [Train] epoch: 3, step: 1639, loss: 0.23210, accuracy: 0.90 [Train] epoch: 3, step: 1640, loss: 0.28963, accuracy: 0.85 [Train] epoch: 3, step: 1641, loss: 0.17274, accuracy: 0.95 [Train] epoch: 3, step: 1642, loss: 0.12611, accuracy: 0.95 [Train] epoch: 3, step: 1643, loss: 0.19327, accuracy: 0.90 [Train] epoch: 3, step: 1644, loss: 0.34968, accuracy: 0.90 [Train] epoch: 3, step: 1645, loss: 0.47273, accuracy: 0.85 [Train] epoch: 3, step: 1646, loss: 0.47871, accuracy: 0.80 [Train] epoch: 3, step: 1647, loss: 0.43582, accuracy: 0.85 [Train] epoch: 3, step: 1648, loss: 0.29802, accuracy: 0.90 [Train] epoch: 3, step: 1649, loss: 0.14710, accuracy: 1.00 [Train] epoch: 3, step: 1650, loss: 0.26370, accuracy: 0.90 [Train] epoch: 3, step: 1651, loss: 0.31656, accuracy: 0.85 [Train] epoch: 3, step: 1652, loss: 0.23902, accuracy: 0.95 [Train] epoch: 3, step:

[Train] epoch: 3, step: 1944, loss: 0.24185, accuracy: 0.85 [Train] epoch: 3, step: 1945, loss: 0.24611, accuracy: 0.90 [Train] epoch: 3, step: 1946, loss: 0.22897, accuracy: 0.95 [Train] epoch: 3, step: 1947, loss: 0.28407, accuracy: 0.90 [Train] epoch: 3, step: 1948, loss: 0.25488, accuracy: 0.90 [Train] epoch: 3, step: 1949, loss: 0.55563, accuracy: 0.90 [Train] epoch: 3, step: 1950, loss: 0.14201, accuracy: 0.95 [Train] epoch: 3, step: 1951, loss: 0.04843, accuracy: 1.00 [Train] epoch: 3, step: 1952, loss: 0.13474, accuracy: 0.95 [Train] epoch: 3, step: 1953, loss: 0.12777, accuracy: 1.00 [Train] epoch: 3, step: 1954, loss: 0.26566, accuracy: 0.95 [Train] epoch: 3, step: 1955, loss: 0.63717, accuracy: 0.70 [Train] epoch: 3, step: 1956, loss: 0.26524, accuracy: 0.90 [Train] epoch: 3, step: 1957, loss: 0.23187, accuracy: 0.95 [Train] epoch: 3, step: 1958, loss: 0.16701, accuracy: 0.90 [Train] epoch: 3, step: 1959, loss: 0.16041, accuracy: 0.95 [Train] epoch: 3, step:

[Train] epoch: 3, step: 2250, loss: 0.47836, accuracy: 0.90 [Train] epoch: 3, step: 2251, loss: 0.59327, accuracy: 0.85 [Train] epoch: 3, step: 2252, loss: 0.47466, accuracy: 0.85 [Train] epoch: 3, step: 2253, loss: 0.34420, accuracy: 0.80 [Train] epoch: 3, step: 2254, loss: 0.19537, accuracy: 0.95 [Train] epoch: 3, step: 2255, loss: 0.23336, accuracy: 0.90 [Train] epoch: 3, step: 2256, loss: 0.18952, accuracy: 0.95 [Train] epoch: 3, step: 2257, loss: 0.48032, accuracy: 0.80 [Train] epoch: 3, step: 2258, loss: 0.25019, accuracy: 0.90 [Train] epoch: 3, step: 2259, loss: 0.27272, accuracy: 0.75 [Train] epoch: 3, step: 2260, loss: 0.35033, accuracy: 0.85 [Train] epoch: 3, step: 2261, loss: 0.52676, accuracy: 0.85 [Train] epoch: 3, step: 2262, loss: 0.26464, accuracy: 0.90 [Train] epoch: 3, step: 2263, loss: 0.37001, accuracy: 0.90 [Train] epoch: 3, step: 2264, loss: 0.27526, accuracy: 0.85 [Train] epoch: 3, step: 2265, loss: 0.30081, accuracy: 0.85 [Train] epoch: 3, step:

[Train] epoch: 3, step: 2552, loss: 0.37744, accuracy: 0.90 [Train] epoch: 3, step: 2553, loss: 0.24715, accuracy: 0.90 [Train] epoch: 3, step: 2554, loss: 0.20687, accuracy: 0.90 [Train] epoch: 3, step: 2555, loss: 0.25506, accuracy: 0.90 [Train] epoch: 3, step: 2556, loss: 0.57441, accuracy: 0.75 [Train] epoch: 3, step: 2557, loss: 0.33224, accuracy: 0.80 [Train] epoch: 3, step: 2558, loss: 0.14664, accuracy: 0.95 [Train] epoch: 3, step: 2559, loss: 0.28937, accuracy: 0.90 [Train] epoch: 3, step: 2560, loss: 0.24069, accuracy: 0.90 [Train] epoch: 3, step: 2561, loss: 0.17164, accuracy: 0.90 [Train] epoch: 3, step: 2562, loss: 0.07253, accuracy: 1.00 [Train] epoch: 3, step: 2563, loss: 0.39388, accuracy: 0.85 [Train] epoch: 3, step: 2564, loss: 0.21045, accuracy: 0.90 [Train] epoch: 3, step: 2565, loss: 0.37853, accuracy: 0.90 [Train] epoch: 3, step: 2566, loss: 0.23368, accuracy: 0.90 [Train] epoch: 3, step: 2567, loss: 0.28517, accuracy: 0.90 [Train] epoch: 3, step:

[Train] epoch: 4, step: 84, loss: 0.11600, accuracy: 0.95 [Train] epoch: 4, step: 85, loss: 0.28086, accuracy: 0.90 [Train] epoch: 4, step: 86, loss: 0.15554, accuracy: 0.95 [Train] epoch: 4, step: 87, loss: 0.12010, accuracy: 0.95 [Train] epoch: 4, step: 88, loss: 0.23155, accuracy: 0.90 [Train] epoch: 4, step: 89, loss: 0.14824, accuracy: 0.95 [Train] epoch: 4, step: 90, loss: 0.35306, accuracy: 0.90 [Train] epoch: 4, step: 91, loss: 0.17554, accuracy: 0.95 [Train] epoch: 4, step: 92, loss: 0.31052, accuracy: 0.95 [Train] epoch: 4, step: 93, loss: 0.28611, accuracy: 0.85 [Train] epoch: 4, step: 94, loss: 0.42292, accuracy: 0.80 [Train] epoch: 4, step: 95, loss: 0.14194, accuracy: 0.95 [Train] epoch: 4, step: 96, loss: 0.20405, accuracy: 0.95 [Train] epoch: 4, step: 97, loss: 0.32027, accuracy: 0.85 [Train] epoch: 4, step: 98, loss: 0.57396, accuracy: 0.75 [Train] epoch: 4, step: 99, loss: 0.30105, accuracy: 0.80 [Train] epoch: 4, step: 100, loss: 0.18662, accuracy: 0

[Train] epoch: 4, step: 385, loss: 0.36355, accuracy: 0.85 [Train] epoch: 4, step: 386, loss: 0.28934, accuracy: 0.80 [Train] epoch: 4, step: 387, loss: 0.68811, accuracy: 0.85 [Train] epoch: 4, step: 388, loss: 0.14768, accuracy: 0.95 [Train] epoch: 4, step: 389, loss: 0.34275, accuracy: 0.80 [Train] epoch: 4, step: 390, loss: 0.32877, accuracy: 0.85 [Train] epoch: 4, step: 391, loss: 0.23857, accuracy: 0.85 [Train] epoch: 4, step: 392, loss: 0.08817, accuracy: 0.95 [Train] epoch: 4, step: 393, loss: 0.25794, accuracy: 0.90 [Train] epoch: 4, step: 394, loss: 0.11236, accuracy: 1.00 [Train] epoch: 4, step: 395, loss: 0.19944, accuracy: 0.90 [Train] epoch: 4, step: 396, loss: 0.40118, accuracy: 0.85 [Train] epoch: 4, step: 397, loss: 0.15687, accuracy: 0.95 [Train] epoch: 4, step: 398, loss: 0.34810, accuracy: 0.85 [Train] epoch: 4, step: 399, loss: 0.26056, accuracy: 0.90 [Train] epoch: 4, step: 400, loss: 0.13023, accuracy: 0.95 [Train] epoch: 4, step: 401, loss: 0.27

[Train] epoch: 4, step: 687, loss: 0.25025, accuracy: 0.90 [Train] epoch: 4, step: 688, loss: 0.18876, accuracy: 0.95 [Train] epoch: 4, step: 689, loss: 0.07029, accuracy: 1.00 [Train] epoch: 4, step: 690, loss: 0.19304, accuracy: 0.90 [Train] epoch: 4, step: 691, loss: 0.14444, accuracy: 0.90 [Train] epoch: 4, step: 692, loss: 0.45519, accuracy: 0.80 [Train] epoch: 4, step: 693, loss: 0.42613, accuracy: 0.90 [Train] epoch: 4, step: 694, loss: 0.26648, accuracy: 0.90 [Train] epoch: 4, step: 695, loss: 0.13346, accuracy: 1.00 [Train] epoch: 4, step: 696, loss: 0.16113, accuracy: 0.90 [Train] epoch: 4, step: 697, loss: 0.34804, accuracy: 0.90 [Train] epoch: 4, step: 698, loss: 0.09658, accuracy: 1.00 [Train] epoch: 4, step: 699, loss: 0.20271, accuracy: 0.95 [Train] epoch: 4, step: 700, loss: 0.49486, accuracy: 0.80 [Train] epoch: 4, step: 701, loss: 0.31282, accuracy: 0.90 [Train] epoch: 4, step: 702, loss: 0.15946, accuracy: 0.95 [Train] epoch: 4, step: 703, loss: 0.50

[Train] epoch: 4, step: 994, loss: 0.27862, accuracy: 0.90 [Train] epoch: 4, step: 995, loss: 0.17415, accuracy: 0.95 [Train] epoch: 4, step: 996, loss: 0.03473, accuracy: 1.00 [Train] epoch: 4, step: 997, loss: 0.24999, accuracy: 0.90 [Train] epoch: 4, step: 998, loss: 0.44879, accuracy: 0.85 [Train] epoch: 4, step: 999, loss: 0.22271, accuracy: 0.90 [Train] epoch: 4, step: 1000, loss: 0.19375, accuracy: 0.90 [Train] epoch: 4, step: 1001, loss: 0.17689, accuracy: 0.95 [Train] epoch: 4, step: 1002, loss: 0.21999, accuracy: 0.95 [Train] epoch: 4, step: 1003, loss: 0.08563, accuracy: 1.00 [Train] epoch: 4, step: 1004, loss: 0.18366, accuracy: 0.95 [Train] epoch: 4, step: 1005, loss: 0.10616, accuracy: 0.95 [Train] epoch: 4, step: 1006, loss: 0.34524, accuracy: 0.85 [Train] epoch: 4, step: 1007, loss: 0.12790, accuracy: 0.95 [Train] epoch: 4, step: 1008, loss: 0.12977, accuracy: 0.95 [Train] epoch: 4, step: 1009, loss: 0.12732, accuracy: 0.95 [Train] epoch: 4, step: 1010,

[Train] epoch: 4, step: 1299, loss: 0.49966, accuracy: 0.85 [Train] epoch: 4, step: 1300, loss: 0.47037, accuracy: 0.90 [Train] epoch: 4, step: 1301, loss: 0.10049, accuracy: 1.00 [Train] epoch: 4, step: 1302, loss: 0.22767, accuracy: 0.90 [Train] epoch: 4, step: 1303, loss: 0.01580, accuracy: 1.00 [Train] epoch: 4, step: 1304, loss: 0.10008, accuracy: 1.00 [Train] epoch: 4, step: 1305, loss: 0.25208, accuracy: 0.90 [Train] epoch: 4, step: 1306, loss: 0.72032, accuracy: 0.65 [Train] epoch: 4, step: 1307, loss: 0.24142, accuracy: 0.95 [Train] epoch: 4, step: 1308, loss: 0.33505, accuracy: 0.90 [Train] epoch: 4, step: 1309, loss: 0.09003, accuracy: 0.95 [Train] epoch: 4, step: 1310, loss: 0.56991, accuracy: 0.75 [Train] epoch: 4, step: 1311, loss: 0.26034, accuracy: 0.90 [Train] epoch: 4, step: 1312, loss: 0.64357, accuracy: 0.80 [Train] epoch: 4, step: 1313, loss: 0.53837, accuracy: 0.80 [Train] epoch: 4, step: 1314, loss: 0.28017, accuracy: 0.90 [Train] epoch: 4, step:

[Train] epoch: 4, step: 1605, loss: 0.26228, accuracy: 0.90 [Train] epoch: 4, step: 1606, loss: 0.19063, accuracy: 0.90 [Train] epoch: 4, step: 1607, loss: 0.30111, accuracy: 0.95 [Train] epoch: 4, step: 1608, loss: 0.11286, accuracy: 0.95 [Train] epoch: 4, step: 1609, loss: 0.12556, accuracy: 0.95 [Train] epoch: 4, step: 1610, loss: 0.23290, accuracy: 0.85 [Train] epoch: 4, step: 1611, loss: 0.10266, accuracy: 1.00 [Train] epoch: 4, step: 1612, loss: 0.51450, accuracy: 0.80 [Train] epoch: 4, step: 1613, loss: 0.40717, accuracy: 0.80 [Train] epoch: 4, step: 1614, loss: 0.23635, accuracy: 0.95 [Train] epoch: 4, step: 1615, loss: 0.47951, accuracy: 0.80 [Train] epoch: 4, step: 1616, loss: 0.18663, accuracy: 0.95 [Train] epoch: 4, step: 1617, loss: 0.04968, accuracy: 1.00 [Train] epoch: 4, step: 1618, loss: 0.70128, accuracy: 0.80 [Train] epoch: 4, step: 1619, loss: 0.52456, accuracy: 0.85 [Train] epoch: 4, step: 1620, loss: 0.14773, accuracy: 0.95 [Train] epoch: 4, step:

[Train] epoch: 4, step: 1906, loss: 0.11912, accuracy: 0.95 [Train] epoch: 4, step: 1907, loss: 0.10388, accuracy: 1.00 [Train] epoch: 4, step: 1908, loss: 0.12527, accuracy: 0.95 [Train] epoch: 4, step: 1909, loss: 0.39160, accuracy: 0.85 [Train] epoch: 4, step: 1910, loss: 0.30602, accuracy: 0.85 [Train] epoch: 4, step: 1911, loss: 0.09099, accuracy: 1.00 [Train] epoch: 4, step: 1912, loss: 0.34212, accuracy: 0.95 [Train] epoch: 4, step: 1913, loss: 0.29015, accuracy: 0.95 [Train] epoch: 4, step: 1914, loss: 0.42161, accuracy: 0.80 [Train] epoch: 4, step: 1915, loss: 0.20177, accuracy: 0.95 [Train] epoch: 4, step: 1916, loss: 0.25288, accuracy: 0.90 [Train] epoch: 4, step: 1917, loss: 0.09183, accuracy: 0.95 [Train] epoch: 4, step: 1918, loss: 0.18579, accuracy: 0.95 [Train] epoch: 4, step: 1919, loss: 0.32843, accuracy: 0.90 [Train] epoch: 4, step: 1920, loss: 0.39318, accuracy: 0.80 [Train] epoch: 4, step: 1921, loss: 0.24919, accuracy: 0.85 [Train] epoch: 4, step:

[Train] epoch: 4, step: 2206, loss: 0.08283, accuracy: 1.00 [Train] epoch: 4, step: 2207, loss: 0.17966, accuracy: 0.95 [Train] epoch: 4, step: 2208, loss: 0.15821, accuracy: 0.95 [Train] epoch: 4, step: 2209, loss: 0.24261, accuracy: 0.95 [Train] epoch: 4, step: 2210, loss: 0.14607, accuracy: 0.95 [Train] epoch: 4, step: 2211, loss: 0.09945, accuracy: 0.95 [Train] epoch: 4, step: 2212, loss: 0.44663, accuracy: 0.85 [Train] epoch: 4, step: 2213, loss: 0.06938, accuracy: 1.00 [Train] epoch: 4, step: 2214, loss: 0.14336, accuracy: 0.95 [Train] epoch: 4, step: 2215, loss: 0.15378, accuracy: 0.95 [Train] epoch: 4, step: 2216, loss: 0.53325, accuracy: 0.80 [Train] epoch: 4, step: 2217, loss: 0.13563, accuracy: 0.95 [Train] epoch: 4, step: 2218, loss: 0.15803, accuracy: 0.95 [Train] epoch: 4, step: 2219, loss: 0.38145, accuracy: 0.85 [Train] epoch: 4, step: 2220, loss: 0.42110, accuracy: 0.90 [Train] epoch: 4, step: 2221, loss: 0.50611, accuracy: 0.80 [Train] epoch: 4, step:

[Train] epoch: 4, step: 2511, loss: 0.39862, accuracy: 0.85 [Train] epoch: 4, step: 2512, loss: 0.28324, accuracy: 0.90 [Train] epoch: 4, step: 2513, loss: 0.29182, accuracy: 0.85 [Train] epoch: 4, step: 2514, loss: 0.18374, accuracy: 1.00 [Train] epoch: 4, step: 2515, loss: 0.27022, accuracy: 0.90 [Train] epoch: 4, step: 2516, loss: 0.33122, accuracy: 0.85 [Train] epoch: 4, step: 2517, loss: 0.45976, accuracy: 0.80 [Train] epoch: 4, step: 2518, loss: 0.24945, accuracy: 0.90 [Train] epoch: 4, step: 2519, loss: 0.34179, accuracy: 0.90 [Train] epoch: 4, step: 2520, loss: 0.11400, accuracy: 0.95 [Train] epoch: 4, step: 2521, loss: 0.32166, accuracy: 0.90 [Train] epoch: 4, step: 2522, loss: 0.20329, accuracy: 0.95 [Train] epoch: 4, step: 2523, loss: 0.35306, accuracy: 0.85 [Train] epoch: 4, step: 2524, loss: 0.32339, accuracy: 0.80 [Train] epoch: 4, step: 2525, loss: 0.08516, accuracy: 1.00 [Train] epoch: 4, step: 2526, loss: 0.19356, accuracy: 0.95 [Train] epoch: 4, step:

[Train] epoch: 5, step: 67, loss: 0.29960, accuracy: 0.85 [Train] epoch: 5, step: 68, loss: 0.06644, accuracy: 1.00 [Train] epoch: 5, step: 69, loss: 0.25758, accuracy: 0.90 [Train] epoch: 5, step: 70, loss: 0.12776, accuracy: 0.95 [Train] epoch: 5, step: 71, loss: 0.37230, accuracy: 0.80 [Train] epoch: 5, step: 72, loss: 0.27515, accuracy: 0.90 [Train] epoch: 5, step: 73, loss: 0.44396, accuracy: 0.80 [Train] epoch: 5, step: 74, loss: 0.29664, accuracy: 0.90 [Train] epoch: 5, step: 75, loss: 0.21321, accuracy: 0.90 [Train] epoch: 5, step: 76, loss: 0.26245, accuracy: 0.85 [Train] epoch: 5, step: 77, loss: 0.11532, accuracy: 0.95 [Train] epoch: 5, step: 78, loss: 0.11709, accuracy: 1.00 [Train] epoch: 5, step: 79, loss: 0.39477, accuracy: 0.90 [Train] epoch: 5, step: 80, loss: 0.34627, accuracy: 0.85 [Train] epoch: 5, step: 81, loss: 0.65613, accuracy: 0.75 [Train] epoch: 5, step: 82, loss: 0.13242, accuracy: 0.95 [Train] epoch: 5, step: 83, loss: 0.35005, accuracy: 0.

[Train] epoch: 5, step: 373, loss: 0.31059, accuracy: 0.85 [Train] epoch: 5, step: 374, loss: 0.27605, accuracy: 0.85 [Train] epoch: 5, step: 375, loss: 0.14038, accuracy: 0.95 [Train] epoch: 5, step: 376, loss: 0.11849, accuracy: 0.95 [Train] epoch: 5, step: 377, loss: 0.09571, accuracy: 0.95 [Train] epoch: 5, step: 378, loss: 0.20119, accuracy: 0.90 [Train] epoch: 5, step: 379, loss: 0.39151, accuracy: 0.75 [Train] epoch: 5, step: 380, loss: 0.21901, accuracy: 0.85 [Train] epoch: 5, step: 381, loss: 0.14169, accuracy: 0.95 [Train] epoch: 5, step: 382, loss: 0.21509, accuracy: 0.85 [Train] epoch: 5, step: 383, loss: 0.19579, accuracy: 0.90 [Train] epoch: 5, step: 384, loss: 0.13601, accuracy: 0.95 [Train] epoch: 5, step: 385, loss: 0.48790, accuracy: 0.80 [Train] epoch: 5, step: 386, loss: 0.28702, accuracy: 0.85 [Train] epoch: 5, step: 387, loss: 0.61370, accuracy: 0.90 [Train] epoch: 5, step: 388, loss: 0.08455, accuracy: 1.00 [Train] epoch: 5, step: 389, loss: 0.25

[Train] epoch: 5, step: 673, loss: 0.56239, accuracy: 0.80 [Train] epoch: 5, step: 674, loss: 0.10094, accuracy: 1.00 [Train] epoch: 5, step: 675, loss: 0.27816, accuracy: 0.90 [Train] epoch: 5, step: 676, loss: 0.05855, accuracy: 1.00 [Train] epoch: 5, step: 677, loss: 0.22773, accuracy: 0.90 [Train] epoch: 5, step: 678, loss: 0.30035, accuracy: 0.90 [Train] epoch: 5, step: 679, loss: 0.24933, accuracy: 0.90 [Train] epoch: 5, step: 680, loss: 0.18515, accuracy: 0.90 [Train] epoch: 5, step: 681, loss: 0.19198, accuracy: 0.90 [Train] epoch: 5, step: 682, loss: 0.01341, accuracy: 1.00 [Train] epoch: 5, step: 683, loss: 0.12686, accuracy: 0.95 [Train] epoch: 5, step: 684, loss: 0.21880, accuracy: 0.95 [Train] epoch: 5, step: 685, loss: 0.20680, accuracy: 0.90 [Train] epoch: 5, step: 686, loss: 0.09518, accuracy: 1.00 [Train] epoch: 5, step: 687, loss: 0.26967, accuracy: 0.85 [Train] epoch: 5, step: 688, loss: 0.15507, accuracy: 0.95 [Train] epoch: 5, step: 689, loss: 0.05

[Train] epoch: 5, step: 979, loss: 0.72363, accuracy: 0.70 [Train] epoch: 5, step: 980, loss: 0.27412, accuracy: 0.85 [Train] epoch: 5, step: 981, loss: 0.38119, accuracy: 0.95 [Train] epoch: 5, step: 982, loss: 0.25895, accuracy: 0.90 [Train] epoch: 5, step: 983, loss: 0.17187, accuracy: 0.90 [Train] epoch: 5, step: 984, loss: 0.03988, accuracy: 1.00 [Train] epoch: 5, step: 985, loss: 0.04518, accuracy: 1.00 [Train] epoch: 5, step: 986, loss: 0.37816, accuracy: 0.85 [Train] epoch: 5, step: 987, loss: 0.22253, accuracy: 0.85 [Train] epoch: 5, step: 988, loss: 0.28277, accuracy: 0.90 [Train] epoch: 5, step: 989, loss: 0.11184, accuracy: 1.00 [Train] epoch: 5, step: 990, loss: 0.61938, accuracy: 0.75 [Train] epoch: 5, step: 991, loss: 0.41980, accuracy: 0.80 [Train] epoch: 5, step: 992, loss: 0.42208, accuracy: 0.80 [Train] epoch: 5, step: 993, loss: 0.10416, accuracy: 0.95 [Train] epoch: 5, step: 994, loss: 0.28101, accuracy: 0.90 [Train] epoch: 5, step: 995, loss: 0.24

[Train] epoch: 5, step: 1283, loss: 0.34764, accuracy: 0.90 [Train] epoch: 5, step: 1284, loss: 0.44613, accuracy: 0.90 [Train] epoch: 5, step: 1285, loss: 0.23826, accuracy: 0.85 [Train] epoch: 5, step: 1286, loss: 0.17509, accuracy: 0.95 [Train] epoch: 5, step: 1287, loss: 0.37656, accuracy: 0.90 [Train] epoch: 5, step: 1288, loss: 0.13215, accuracy: 0.95 [Train] epoch: 5, step: 1289, loss: 0.48417, accuracy: 0.80 [Train] epoch: 5, step: 1290, loss: 0.07937, accuracy: 1.00 [Train] epoch: 5, step: 1291, loss: 0.46171, accuracy: 0.85 [Train] epoch: 5, step: 1292, loss: 0.23717, accuracy: 0.90 [Train] epoch: 5, step: 1293, loss: 0.14233, accuracy: 0.90 [Train] epoch: 5, step: 1294, loss: 0.24333, accuracy: 0.95 [Train] epoch: 5, step: 1295, loss: 0.63018, accuracy: 0.75 [Train] epoch: 5, step: 1296, loss: 0.12137, accuracy: 0.90 [Train] epoch: 5, step: 1297, loss: 0.40836, accuracy: 0.90 [Train] epoch: 5, step: 1298, loss: 0.33303, accuracy: 0.95 [Train] epoch: 5, step:

[Train] epoch: 5, step: 1589, loss: 0.52839, accuracy: 0.85 [Train] epoch: 5, step: 1590, loss: 0.08076, accuracy: 1.00 [Train] epoch: 5, step: 1591, loss: 0.28778, accuracy: 0.85 [Train] epoch: 5, step: 1592, loss: 0.23132, accuracy: 0.85 [Train] epoch: 5, step: 1593, loss: 0.08787, accuracy: 0.90 [Train] epoch: 5, step: 1594, loss: 0.35223, accuracy: 0.80 [Train] epoch: 5, step: 1595, loss: 0.15641, accuracy: 0.95 [Train] epoch: 5, step: 1596, loss: 0.34667, accuracy: 0.75 [Train] epoch: 5, step: 1597, loss: 0.03844, accuracy: 1.00 [Train] epoch: 5, step: 1598, loss: 0.68731, accuracy: 0.80 [Train] epoch: 5, step: 1599, loss: 0.28436, accuracy: 0.85 [Train] epoch: 5, step: 1600, loss: 0.39379, accuracy: 0.85 [Train] epoch: 5, step: 1601, loss: 0.23838, accuracy: 0.85 [Train] epoch: 5, step: 1602, loss: 0.34045, accuracy: 0.95 [Train] epoch: 5, step: 1603, loss: 0.31676, accuracy: 0.85 [Train] epoch: 5, step: 1604, loss: 0.48825, accuracy: 0.90 [Train] epoch: 5, step:

[Train] epoch: 5, step: 1896, loss: 0.22978, accuracy: 0.90 [Train] epoch: 5, step: 1897, loss: 0.22214, accuracy: 0.90 [Train] epoch: 5, step: 1898, loss: 0.08499, accuracy: 1.00 [Train] epoch: 5, step: 1899, loss: 0.32238, accuracy: 0.95 [Train] epoch: 5, step: 1900, loss: 0.23369, accuracy: 0.90 [Train] epoch: 5, step: 1901, loss: 0.22727, accuracy: 0.90 [Train] epoch: 5, step: 1902, loss: 0.21401, accuracy: 0.90 [Train] epoch: 5, step: 1903, loss: 0.18050, accuracy: 0.90 [Train] epoch: 5, step: 1904, loss: 0.39840, accuracy: 0.80 [Train] epoch: 5, step: 1905, loss: 0.12428, accuracy: 0.95 [Train] epoch: 5, step: 1906, loss: 0.09433, accuracy: 0.95 [Train] epoch: 5, step: 1907, loss: 0.13630, accuracy: 1.00 [Train] epoch: 5, step: 1908, loss: 0.14115, accuracy: 0.95 [Train] epoch: 5, step: 1909, loss: 0.42147, accuracy: 0.85 [Train] epoch: 5, step: 1910, loss: 0.33958, accuracy: 0.85 [Train] epoch: 5, step: 1911, loss: 0.09577, accuracy: 1.00 [Train] epoch: 5, step:

[Train] epoch: 5, step: 2204, loss: 0.03867, accuracy: 1.00 [Train] epoch: 5, step: 2205, loss: 0.08415, accuracy: 1.00 [Train] epoch: 5, step: 2206, loss: 0.09146, accuracy: 1.00 [Train] epoch: 5, step: 2207, loss: 0.17022, accuracy: 0.95 [Train] epoch: 5, step: 2208, loss: 0.18879, accuracy: 0.95 [Train] epoch: 5, step: 2209, loss: 0.30836, accuracy: 0.90 [Train] epoch: 5, step: 2210, loss: 0.19689, accuracy: 0.90 [Train] epoch: 5, step: 2211, loss: 0.08048, accuracy: 0.95 [Train] epoch: 5, step: 2212, loss: 0.40609, accuracy: 0.85 [Train] epoch: 5, step: 2213, loss: 0.13544, accuracy: 0.95 [Train] epoch: 5, step: 2214, loss: 0.17934, accuracy: 0.95 [Train] epoch: 5, step: 2215, loss: 0.23002, accuracy: 0.85 [Train] epoch: 5, step: 2216, loss: 0.57664, accuracy: 0.80 [Train] epoch: 5, step: 2217, loss: 0.11901, accuracy: 0.95 [Train] epoch: 5, step: 2218, loss: 0.10223, accuracy: 0.95 [Train] epoch: 5, step: 2219, loss: 0.31543, accuracy: 0.85 [Train] epoch: 5, step:

[Train] epoch: 5, step: 2504, loss: 0.14289, accuracy: 0.95 [Train] epoch: 5, step: 2505, loss: 0.06886, accuracy: 1.00 [Train] epoch: 5, step: 2506, loss: 0.31151, accuracy: 0.85 [Train] epoch: 5, step: 2507, loss: 0.17568, accuracy: 0.90 [Train] epoch: 5, step: 2508, loss: 0.21848, accuracy: 0.95 [Train] epoch: 5, step: 2509, loss: 0.49222, accuracy: 0.85 [Train] epoch: 5, step: 2510, loss: 0.09575, accuracy: 0.95 [Train] epoch: 5, step: 2511, loss: 0.34996, accuracy: 0.90 [Train] epoch: 5, step: 2512, loss: 0.25572, accuracy: 0.90 [Train] epoch: 5, step: 2513, loss: 0.26653, accuracy: 0.95 [Train] epoch: 5, step: 2514, loss: 0.15322, accuracy: 1.00 [Train] epoch: 5, step: 2515, loss: 0.27292, accuracy: 0.90 [Train] epoch: 5, step: 2516, loss: 0.22350, accuracy: 0.95 [Train] epoch: 5, step: 2517, loss: 0.39177, accuracy: 0.80 [Train] epoch: 5, step: 2518, loss: 0.27818, accuracy: 0.90 [Train] epoch: 5, step: 2519, loss: 0.24136, accuracy: 0.95 [Train] epoch: 5, step:

[Train] epoch: 6, step: 50, loss: 0.21478, accuracy: 0.90 [Train] epoch: 6, step: 51, loss: 0.10617, accuracy: 0.95 [Train] epoch: 6, step: 52, loss: 0.19593, accuracy: 0.95 [Train] epoch: 6, step: 53, loss: 0.28638, accuracy: 0.95 [Train] epoch: 6, step: 54, loss: 0.57161, accuracy: 0.85 [Train] epoch: 6, step: 55, loss: 0.29781, accuracy: 0.95 [Train] epoch: 6, step: 56, loss: 0.14041, accuracy: 0.95 [Train] epoch: 6, step: 57, loss: 0.19589, accuracy: 0.90 [Train] epoch: 6, step: 58, loss: 0.14066, accuracy: 0.95 [Train] epoch: 6, step: 59, loss: 0.14467, accuracy: 0.95 [Train] epoch: 6, step: 60, loss: 0.13918, accuracy: 0.95 [Train] epoch: 6, step: 61, loss: 0.29773, accuracy: 0.85 [Train] epoch: 6, step: 62, loss: 0.13947, accuracy: 0.90 [Train] epoch: 6, step: 63, loss: 0.45708, accuracy: 0.80 [Train] epoch: 6, step: 64, loss: 0.38931, accuracy: 0.85 [Train] epoch: 6, step: 65, loss: 0.13069, accuracy: 0.95 [Train] epoch: 6, step: 66, loss: 0.13670, accuracy: 0.

[Train] epoch: 6, step: 356, loss: 0.27683, accuracy: 0.90 [Train] epoch: 6, step: 357, loss: 0.41272, accuracy: 0.75 [Train] epoch: 6, step: 358, loss: 0.05794, accuracy: 1.00 [Train] epoch: 6, step: 359, loss: 0.55931, accuracy: 0.75 [Train] epoch: 6, step: 360, loss: 0.32972, accuracy: 0.95 [Train] epoch: 6, step: 361, loss: 0.24519, accuracy: 0.90 [Train] epoch: 6, step: 362, loss: 0.16668, accuracy: 0.95 [Train] epoch: 6, step: 363, loss: 0.15463, accuracy: 0.95 [Train] epoch: 6, step: 364, loss: 0.37276, accuracy: 0.85 [Train] epoch: 6, step: 365, loss: 0.19146, accuracy: 0.90 [Train] epoch: 6, step: 366, loss: 0.22737, accuracy: 0.95 [Train] epoch: 6, step: 367, loss: 0.16607, accuracy: 0.95 [Train] epoch: 6, step: 368, loss: 0.22870, accuracy: 0.95 [Train] epoch: 6, step: 369, loss: 0.35741, accuracy: 0.85 [Train] epoch: 6, step: 370, loss: 0.51808, accuracy: 0.75 [Train] epoch: 6, step: 371, loss: 0.50035, accuracy: 0.85 [Train] epoch: 6, step: 372, loss: 0.12

[Train] epoch: 6, step: 661, loss: 0.05056, accuracy: 1.00 [Train] epoch: 6, step: 662, loss: 0.63181, accuracy: 0.80 [Train] epoch: 6, step: 663, loss: 0.40498, accuracy: 0.90 [Train] epoch: 6, step: 664, loss: 0.42731, accuracy: 0.85 [Train] epoch: 6, step: 665, loss: 0.11526, accuracy: 0.95 [Train] epoch: 6, step: 666, loss: 0.15400, accuracy: 0.95 [Train] epoch: 6, step: 667, loss: 0.23095, accuracy: 0.85 [Train] epoch: 6, step: 668, loss: 0.15239, accuracy: 0.95 [Train] epoch: 6, step: 669, loss: 0.55500, accuracy: 0.85 [Train] epoch: 6, step: 670, loss: 0.25051, accuracy: 0.90 [Train] epoch: 6, step: 671, loss: 0.47367, accuracy: 0.90 [Train] epoch: 6, step: 672, loss: 0.21797, accuracy: 0.85 [Train] epoch: 6, step: 673, loss: 0.78349, accuracy: 0.75 [Train] epoch: 6, step: 674, loss: 0.21191, accuracy: 0.90 [Train] epoch: 6, step: 675, loss: 0.14173, accuracy: 0.95 [Train] epoch: 6, step: 676, loss: 0.12997, accuracy: 1.00 [Train] epoch: 6, step: 677, loss: 0.26

[Train] epoch: 6, step: 964, loss: 0.22848, accuracy: 0.90 [Train] epoch: 6, step: 965, loss: 0.50049, accuracy: 0.85 [Train] epoch: 6, step: 966, loss: 0.43352, accuracy: 0.90 [Train] epoch: 6, step: 967, loss: 0.40462, accuracy: 0.95 [Train] epoch: 6, step: 968, loss: 0.25511, accuracy: 0.90 [Train] epoch: 6, step: 969, loss: 0.08483, accuracy: 0.95 [Train] epoch: 6, step: 970, loss: 0.23446, accuracy: 0.95 [Train] epoch: 6, step: 971, loss: 0.27813, accuracy: 0.90 [Train] epoch: 6, step: 972, loss: 0.41157, accuracy: 0.85 [Train] epoch: 6, step: 973, loss: 0.09408, accuracy: 1.00 [Train] epoch: 6, step: 974, loss: 0.22813, accuracy: 0.95 [Train] epoch: 6, step: 975, loss: 0.54834, accuracy: 0.80 [Train] epoch: 6, step: 976, loss: 0.21931, accuracy: 0.95 [Train] epoch: 6, step: 977, loss: 0.26527, accuracy: 0.90 [Train] epoch: 6, step: 978, loss: 0.30247, accuracy: 0.90 [Train] epoch: 6, step: 979, loss: 0.68035, accuracy: 0.80 [Train] epoch: 6, step: 980, loss: 0.19

[Train] epoch: 6, step: 1266, loss: 0.28916, accuracy: 0.80 [Train] epoch: 6, step: 1267, loss: 0.29759, accuracy: 0.85 [Train] epoch: 6, step: 1268, loss: 0.07243, accuracy: 1.00 [Train] epoch: 6, step: 1269, loss: 0.14011, accuracy: 0.95 [Train] epoch: 6, step: 1270, loss: 0.24584, accuracy: 0.90 [Train] epoch: 6, step: 1271, loss: 0.14143, accuracy: 0.95 [Train] epoch: 6, step: 1272, loss: 0.19526, accuracy: 0.95 [Train] epoch: 6, step: 1273, loss: 0.14397, accuracy: 0.95 [Train] epoch: 6, step: 1274, loss: 0.37772, accuracy: 0.90 [Train] epoch: 6, step: 1275, loss: 0.19041, accuracy: 0.95 [Train] epoch: 6, step: 1276, loss: 0.04420, accuracy: 1.00 [Train] epoch: 6, step: 1277, loss: 0.26682, accuracy: 0.90 [Train] epoch: 6, step: 1278, loss: 0.13468, accuracy: 0.95 [Train] epoch: 6, step: 1279, loss: 0.22199, accuracy: 0.90 [Train] epoch: 6, step: 1280, loss: 0.55593, accuracy: 0.85 [Train] epoch: 6, step: 1281, loss: 0.21418, accuracy: 0.90 [Train] epoch: 6, step:

[Train] epoch: 6, step: 1572, loss: 0.31326, accuracy: 0.90 [Train] epoch: 6, step: 1573, loss: 0.35499, accuracy: 0.90 [Train] epoch: 6, step: 1574, loss: 0.38358, accuracy: 0.85 [Train] epoch: 6, step: 1575, loss: 0.69296, accuracy: 0.75 [Train] epoch: 6, step: 1576, loss: 0.19327, accuracy: 0.90 [Train] epoch: 6, step: 1577, loss: 0.11126, accuracy: 0.95 [Train] epoch: 6, step: 1578, loss: 0.43828, accuracy: 0.85 [Train] epoch: 6, step: 1579, loss: 0.13686, accuracy: 0.90 [Train] epoch: 6, step: 1580, loss: 0.22395, accuracy: 0.90 [Train] epoch: 6, step: 1581, loss: 0.23694, accuracy: 0.95 [Train] epoch: 6, step: 1582, loss: 0.33077, accuracy: 0.90 [Train] epoch: 6, step: 1583, loss: 0.18289, accuracy: 0.95 [Train] epoch: 6, step: 1584, loss: 0.21899, accuracy: 0.90 [Train] epoch: 6, step: 1585, loss: 0.68577, accuracy: 0.80 [Train] epoch: 6, step: 1586, loss: 0.17659, accuracy: 0.95 [Train] epoch: 6, step: 1587, loss: 0.16319, accuracy: 0.95 [Train] epoch: 6, step:

[Train] epoch: 6, step: 1876, loss: 0.33999, accuracy: 0.85 [Train] epoch: 6, step: 1877, loss: 0.07912, accuracy: 1.00 [Train] epoch: 6, step: 1878, loss: 0.08808, accuracy: 0.95 [Train] epoch: 6, step: 1879, loss: 0.22648, accuracy: 0.95 [Train] epoch: 6, step: 1880, loss: 0.21015, accuracy: 0.90 [Train] epoch: 6, step: 1881, loss: 0.03661, accuracy: 1.00 [Train] epoch: 6, step: 1882, loss: 0.14535, accuracy: 0.95 [Train] epoch: 6, step: 1883, loss: 0.06133, accuracy: 1.00 [Train] epoch: 6, step: 1884, loss: 0.38021, accuracy: 0.85 [Train] epoch: 6, step: 1885, loss: 0.17425, accuracy: 0.90 [Train] epoch: 6, step: 1886, loss: 0.40436, accuracy: 0.90 [Train] epoch: 6, step: 1887, loss: 0.17730, accuracy: 0.85 [Train] epoch: 6, step: 1888, loss: 0.22606, accuracy: 0.90 [Train] epoch: 6, step: 1889, loss: 0.47614, accuracy: 0.95 [Train] epoch: 6, step: 1890, loss: 0.24147, accuracy: 0.85 [Train] epoch: 6, step: 1891, loss: 0.17800, accuracy: 0.85 [Train] epoch: 6, step:

[Train] epoch: 6, step: 2181, loss: 0.44654, accuracy: 0.85 [Train] epoch: 6, step: 2182, loss: 0.20089, accuracy: 0.90 [Train] epoch: 6, step: 2183, loss: 0.12483, accuracy: 0.95 [Train] epoch: 6, step: 2184, loss: 0.22832, accuracy: 0.95 [Train] epoch: 6, step: 2185, loss: 0.17466, accuracy: 0.95 [Train] epoch: 6, step: 2186, loss: 0.29193, accuracy: 0.85 [Train] epoch: 6, step: 2187, loss: 0.31330, accuracy: 0.90 [Train] epoch: 6, step: 2188, loss: 0.11626, accuracy: 0.95 [Train] epoch: 6, step: 2189, loss: 0.15315, accuracy: 0.95 [Train] epoch: 6, step: 2190, loss: 0.11575, accuracy: 0.95 [Train] epoch: 6, step: 2191, loss: 0.15628, accuracy: 0.95 [Train] epoch: 6, step: 2192, loss: 0.29978, accuracy: 0.90 [Train] epoch: 6, step: 2193, loss: 0.09666, accuracy: 0.95 [Train] epoch: 6, step: 2194, loss: 0.20291, accuracy: 0.90 [Train] epoch: 6, step: 2195, loss: 0.37512, accuracy: 0.90 [Train] epoch: 6, step: 2196, loss: 0.15106, accuracy: 0.95 [Train] epoch: 6, step:

[Train] epoch: 6, step: 2483, loss: 0.06969, accuracy: 1.00 [Train] epoch: 6, step: 2484, loss: 0.22903, accuracy: 0.90 [Train] epoch: 6, step: 2485, loss: 0.16607, accuracy: 0.90 [Train] epoch: 6, step: 2486, loss: 0.11932, accuracy: 0.95 [Train] epoch: 6, step: 2487, loss: 0.32139, accuracy: 0.90 [Train] epoch: 6, step: 2488, loss: 0.16417, accuracy: 0.95 [Train] epoch: 6, step: 2489, loss: 0.20668, accuracy: 0.90 [Train] epoch: 6, step: 2490, loss: 0.13724, accuracy: 0.95 [Train] epoch: 6, step: 2491, loss: 0.30803, accuracy: 0.90 [Train] epoch: 6, step: 2492, loss: 0.15888, accuracy: 0.95 [Train] epoch: 6, step: 2493, loss: 0.14977, accuracy: 0.95 [Train] epoch: 6, step: 2494, loss: 0.13074, accuracy: 0.95 [Train] epoch: 6, step: 2495, loss: 0.12861, accuracy: 0.95 [Train] epoch: 6, step: 2496, loss: 0.18223, accuracy: 0.90 [Train] epoch: 6, step: 2497, loss: 0.09609, accuracy: 1.00 [Train] epoch: 6, step: 2498, loss: 0.64072, accuracy: 0.75 [Train] epoch: 6, step:

[Train] epoch: 7, step: 40, loss: 0.10345, accuracy: 0.95 [Train] epoch: 7, step: 41, loss: 0.30709, accuracy: 0.90 [Train] epoch: 7, step: 42, loss: 0.10892, accuracy: 0.95 [Train] epoch: 7, step: 43, loss: 0.34317, accuracy: 0.90 [Train] epoch: 7, step: 44, loss: 0.03974, accuracy: 1.00 [Train] epoch: 7, step: 45, loss: 0.10194, accuracy: 1.00 [Train] epoch: 7, step: 46, loss: 0.23253, accuracy: 0.85 [Train] epoch: 7, step: 47, loss: 0.33314, accuracy: 0.80 [Train] epoch: 7, step: 48, loss: 0.10811, accuracy: 0.95 [Train] epoch: 7, step: 49, loss: 0.37466, accuracy: 0.90 [Train] epoch: 7, step: 50, loss: 0.20250, accuracy: 0.90 [Train] epoch: 7, step: 51, loss: 0.09977, accuracy: 0.95 [Train] epoch: 7, step: 52, loss: 0.16854, accuracy: 0.95 [Train] epoch: 7, step: 53, loss: 0.21725, accuracy: 0.95 [Train] epoch: 7, step: 54, loss: 0.46330, accuracy: 0.85 [Train] epoch: 7, step: 55, loss: 0.59501, accuracy: 0.90 [Train] epoch: 7, step: 56, loss: 0.22389, accuracy: 0.

[Train] epoch: 7, step: 346, loss: 0.17041, accuracy: 0.85 [Train] epoch: 7, step: 347, loss: 0.18965, accuracy: 0.95 [Train] epoch: 7, step: 348, loss: 0.06567, accuracy: 1.00 [Train] epoch: 7, step: 349, loss: 0.50121, accuracy: 0.85 [Train] epoch: 7, step: 350, loss: 0.19596, accuracy: 0.95 [Train] epoch: 7, step: 351, loss: 0.08442, accuracy: 1.00 [Train] epoch: 7, step: 352, loss: 0.07165, accuracy: 0.95 [Train] epoch: 7, step: 353, loss: 0.28421, accuracy: 0.90 [Train] epoch: 7, step: 354, loss: 0.24222, accuracy: 0.90 [Train] epoch: 7, step: 355, loss: 0.15797, accuracy: 0.90 [Train] epoch: 7, step: 356, loss: 0.34432, accuracy: 0.85 [Train] epoch: 7, step: 357, loss: 0.49348, accuracy: 0.85 [Train] epoch: 7, step: 358, loss: 0.03604, accuracy: 1.00 [Train] epoch: 7, step: 359, loss: 0.43510, accuracy: 0.85 [Train] epoch: 7, step: 360, loss: 0.29795, accuracy: 0.95 [Train] epoch: 7, step: 361, loss: 0.27236, accuracy: 0.85 [Train] epoch: 7, step: 362, loss: 0.12

[Train] epoch: 7, step: 653, loss: 0.19168, accuracy: 0.90 [Train] epoch: 7, step: 654, loss: 0.21811, accuracy: 0.90 [Train] epoch: 7, step: 655, loss: 0.25464, accuracy: 0.90 [Train] epoch: 7, step: 656, loss: 0.33736, accuracy: 0.85 [Train] epoch: 7, step: 657, loss: 0.32184, accuracy: 0.90 [Train] epoch: 7, step: 658, loss: 0.16893, accuracy: 0.95 [Train] epoch: 7, step: 659, loss: 0.69540, accuracy: 0.75 [Train] epoch: 7, step: 660, loss: 0.19351, accuracy: 0.95 [Train] epoch: 7, step: 661, loss: 0.05005, accuracy: 1.00 [Train] epoch: 7, step: 662, loss: 0.60069, accuracy: 0.80 [Train] epoch: 7, step: 663, loss: 0.44184, accuracy: 0.90 [Train] epoch: 7, step: 664, loss: 0.22896, accuracy: 1.00 [Train] epoch: 7, step: 665, loss: 0.07030, accuracy: 1.00 [Train] epoch: 7, step: 666, loss: 0.11660, accuracy: 0.95 [Train] epoch: 7, step: 667, loss: 0.22521, accuracy: 0.90 [Train] epoch: 7, step: 668, loss: 0.15270, accuracy: 0.90 [Train] epoch: 7, step: 669, loss: 0.58

[Train] epoch: 7, step: 956, loss: 0.06768, accuracy: 1.00 [Train] epoch: 7, step: 957, loss: 0.27738, accuracy: 0.85 [Train] epoch: 7, step: 958, loss: 0.11073, accuracy: 0.95 [Train] epoch: 7, step: 959, loss: 0.21011, accuracy: 0.90 [Train] epoch: 7, step: 960, loss: 0.19763, accuracy: 0.95 [Train] epoch: 7, step: 961, loss: 0.15542, accuracy: 0.95 [Train] epoch: 7, step: 962, loss: 0.14933, accuracy: 0.95 [Train] epoch: 7, step: 963, loss: 0.23871, accuracy: 0.85 [Train] epoch: 7, step: 964, loss: 0.25459, accuracy: 0.90 [Train] epoch: 7, step: 965, loss: 0.25995, accuracy: 0.90 [Train] epoch: 7, step: 966, loss: 0.49029, accuracy: 0.85 [Train] epoch: 7, step: 967, loss: 0.44137, accuracy: 0.90 [Train] epoch: 7, step: 968, loss: 0.17226, accuracy: 0.95 [Train] epoch: 7, step: 969, loss: 0.09083, accuracy: 0.95 [Train] epoch: 7, step: 970, loss: 0.34879, accuracy: 0.85 [Train] epoch: 7, step: 971, loss: 0.21738, accuracy: 0.95 [Train] epoch: 7, step: 972, loss: 0.37

[Train] epoch: 7, step: 1261, loss: 0.12966, accuracy: 0.95 [Train] epoch: 7, step: 1262, loss: 0.12297, accuracy: 1.00 [Train] epoch: 7, step: 1263, loss: 0.11230, accuracy: 0.95 [Train] epoch: 7, step: 1264, loss: 0.30535, accuracy: 0.85 [Train] epoch: 7, step: 1265, loss: 0.11276, accuracy: 0.95 [Train] epoch: 7, step: 1266, loss: 0.27019, accuracy: 0.85 [Train] epoch: 7, step: 1267, loss: 0.27437, accuracy: 0.85 [Train] epoch: 7, step: 1268, loss: 0.06333, accuracy: 1.00 [Train] epoch: 7, step: 1269, loss: 0.10598, accuracy: 0.95 [Train] epoch: 7, step: 1270, loss: 0.20732, accuracy: 0.90 [Train] epoch: 7, step: 1271, loss: 0.15503, accuracy: 0.90 [Train] epoch: 7, step: 1272, loss: 0.16484, accuracy: 0.95 [Train] epoch: 7, step: 1273, loss: 0.14552, accuracy: 0.90 [Train] epoch: 7, step: 1274, loss: 0.38258, accuracy: 0.90 [Train] epoch: 7, step: 1275, loss: 0.24139, accuracy: 0.90 [Train] epoch: 7, step: 1276, loss: 0.04659, accuracy: 1.00 [Train] epoch: 7, step:

[Train] epoch: 7, step: 1568, loss: 0.21376, accuracy: 0.90 [Train] epoch: 7, step: 1569, loss: 0.13583, accuracy: 1.00 [Train] epoch: 7, step: 1570, loss: 0.35718, accuracy: 0.85 [Train] epoch: 7, step: 1571, loss: 0.36635, accuracy: 0.85 [Train] epoch: 7, step: 1572, loss: 0.37745, accuracy: 0.85 [Train] epoch: 7, step: 1573, loss: 0.31178, accuracy: 0.90 [Train] epoch: 7, step: 1574, loss: 0.31261, accuracy: 0.85 [Train] epoch: 7, step: 1575, loss: 0.46800, accuracy: 0.80 [Train] epoch: 7, step: 1576, loss: 0.20977, accuracy: 0.90 [Train] epoch: 7, step: 1577, loss: 0.13708, accuracy: 0.95 [Train] epoch: 7, step: 1578, loss: 0.35449, accuracy: 0.85 [Train] epoch: 7, step: 1579, loss: 0.11771, accuracy: 0.95 [Train] epoch: 7, step: 1580, loss: 0.18339, accuracy: 0.95 [Train] epoch: 7, step: 1581, loss: 0.25676, accuracy: 0.90 [Train] epoch: 7, step: 1582, loss: 0.29890, accuracy: 0.90 [Train] epoch: 7, step: 1583, loss: 0.19648, accuracy: 0.95 [Train] epoch: 7, step:

[Train] epoch: 7, step: 1877, loss: 0.08628, accuracy: 1.00 [Train] epoch: 7, step: 1878, loss: 0.09227, accuracy: 0.95 [Train] epoch: 7, step: 1879, loss: 0.20546, accuracy: 0.95 [Train] epoch: 7, step: 1880, loss: 0.22125, accuracy: 0.90 [Train] epoch: 7, step: 1881, loss: 0.04210, accuracy: 1.00 [Train] epoch: 7, step: 1882, loss: 0.18275, accuracy: 0.95 [Train] epoch: 7, step: 1883, loss: 0.02919, accuracy: 1.00 [Train] epoch: 7, step: 1884, loss: 0.34505, accuracy: 0.90 [Train] epoch: 7, step: 1885, loss: 0.13824, accuracy: 0.90 [Train] epoch: 7, step: 1886, loss: 0.37012, accuracy: 0.85 [Train] epoch: 7, step: 1887, loss: 0.16644, accuracy: 0.90 [Train] epoch: 7, step: 1888, loss: 0.20280, accuracy: 0.90 [Train] epoch: 7, step: 1889, loss: 0.17765, accuracy: 0.90 [Train] epoch: 7, step: 1890, loss: 0.26277, accuracy: 0.85 [Train] epoch: 7, step: 1891, loss: 0.14964, accuracy: 0.95 [Train] epoch: 7, step: 1892, loss: 0.05236, accuracy: 1.00 [Train] epoch: 7, step:

[Train] epoch: 7, step: 2181, loss: 0.45526, accuracy: 0.80 [Train] epoch: 7, step: 2182, loss: 0.17394, accuracy: 0.95 [Train] epoch: 7, step: 2183, loss: 0.12060, accuracy: 1.00 [Train] epoch: 7, step: 2184, loss: 0.22449, accuracy: 0.95 [Train] epoch: 7, step: 2185, loss: 0.12894, accuracy: 0.95 [Train] epoch: 7, step: 2186, loss: 0.35330, accuracy: 0.85 [Train] epoch: 7, step: 2187, loss: 0.38119, accuracy: 0.85 [Train] epoch: 7, step: 2188, loss: 0.08093, accuracy: 1.00 [Train] epoch: 7, step: 2189, loss: 0.21034, accuracy: 0.95 [Train] epoch: 7, step: 2190, loss: 0.10274, accuracy: 0.95 [Train] epoch: 7, step: 2191, loss: 0.18269, accuracy: 0.85 [Train] epoch: 7, step: 2192, loss: 0.22192, accuracy: 0.90 [Train] epoch: 7, step: 2193, loss: 0.09121, accuracy: 0.95 [Train] epoch: 7, step: 2194, loss: 0.14147, accuracy: 0.95 [Train] epoch: 7, step: 2195, loss: 0.35988, accuracy: 0.90 [Train] epoch: 7, step: 2196, loss: 0.03217, accuracy: 1.00 [Train] epoch: 7, step:

[Train] epoch: 7, step: 2486, loss: 0.12297, accuracy: 0.95 [Train] epoch: 7, step: 2487, loss: 0.38171, accuracy: 0.90 [Train] epoch: 7, step: 2488, loss: 0.18157, accuracy: 0.85 [Train] epoch: 7, step: 2489, loss: 0.17657, accuracy: 0.90 [Train] epoch: 7, step: 2490, loss: 0.14257, accuracy: 0.95 [Train] epoch: 7, step: 2491, loss: 0.27921, accuracy: 0.90 [Train] epoch: 7, step: 2492, loss: 0.09263, accuracy: 1.00 [Train] epoch: 7, step: 2493, loss: 0.12347, accuracy: 1.00 [Train] epoch: 7, step: 2494, loss: 0.12995, accuracy: 0.95 [Train] epoch: 7, step: 2495, loss: 0.12197, accuracy: 0.95 [Train] epoch: 7, step: 2496, loss: 0.14076, accuracy: 0.90 [Train] epoch: 7, step: 2497, loss: 0.08060, accuracy: 1.00 [Train] epoch: 7, step: 2498, loss: 0.55626, accuracy: 0.75 [Train] epoch: 7, step: 2499, loss: 0.46851, accuracy: 0.90 [Train] epoch: 7, step: 2500, loss: 0.80757, accuracy: 0.75 [Train] epoch: 7, step: 2501, loss: 0.33176, accuracy: 0.85 [Train] epoch: 7, step:

[Train] epoch: 8, step: 42, loss: 0.09504, accuracy: 0.95 [Train] epoch: 8, step: 43, loss: 0.34075, accuracy: 0.90 [Train] epoch: 8, step: 44, loss: 0.04341, accuracy: 1.00 [Train] epoch: 8, step: 45, loss: 0.15679, accuracy: 0.95 [Train] epoch: 8, step: 46, loss: 0.22826, accuracy: 0.90 [Train] epoch: 8, step: 47, loss: 0.33011, accuracy: 0.80 [Train] epoch: 8, step: 48, loss: 0.13344, accuracy: 0.90 [Train] epoch: 8, step: 49, loss: 0.27123, accuracy: 0.90 [Train] epoch: 8, step: 50, loss: 0.26016, accuracy: 0.90 [Train] epoch: 8, step: 51, loss: 0.05901, accuracy: 1.00 [Train] epoch: 8, step: 52, loss: 0.17006, accuracy: 0.95 [Train] epoch: 8, step: 53, loss: 0.18806, accuracy: 0.95 [Train] epoch: 8, step: 54, loss: 0.45607, accuracy: 0.90 [Train] epoch: 8, step: 55, loss: 0.32430, accuracy: 0.95 [Train] epoch: 8, step: 56, loss: 0.15038, accuracy: 0.95 [Train] epoch: 8, step: 57, loss: 0.20472, accuracy: 0.90 [Train] epoch: 8, step: 58, loss: 0.33962, accuracy: 0.

[Train] epoch: 8, step: 347, loss: 0.14142, accuracy: 0.95 [Train] epoch: 8, step: 348, loss: 0.06695, accuracy: 1.00 [Train] epoch: 8, step: 349, loss: 0.22072, accuracy: 0.90 [Train] epoch: 8, step: 350, loss: 0.13267, accuracy: 0.95 [Train] epoch: 8, step: 351, loss: 0.07053, accuracy: 1.00 [Train] epoch: 8, step: 352, loss: 0.02985, accuracy: 1.00 [Train] epoch: 8, step: 353, loss: 0.20271, accuracy: 0.85 [Train] epoch: 8, step: 354, loss: 0.33237, accuracy: 0.85 [Train] epoch: 8, step: 355, loss: 0.07331, accuracy: 0.95 [Train] epoch: 8, step: 356, loss: 0.34024, accuracy: 0.85 [Train] epoch: 8, step: 357, loss: 0.46851, accuracy: 0.80 [Train] epoch: 8, step: 358, loss: 0.05376, accuracy: 1.00 [Train] epoch: 8, step: 359, loss: 0.44702, accuracy: 0.80 [Train] epoch: 8, step: 360, loss: 0.22461, accuracy: 0.95 [Train] epoch: 8, step: 361, loss: 0.22974, accuracy: 0.85 [Train] epoch: 8, step: 362, loss: 0.10297, accuracy: 0.95 [Train] epoch: 8, step: 363, loss: 0.09

[Train] epoch: 8, step: 655, loss: 0.16981, accuracy: 0.95 [Train] epoch: 8, step: 656, loss: 0.21989, accuracy: 0.85 [Train] epoch: 8, step: 657, loss: 0.23216, accuracy: 0.90 [Train] epoch: 8, step: 658, loss: 0.17014, accuracy: 0.95 [Train] epoch: 8, step: 659, loss: 0.57618, accuracy: 0.80 [Train] epoch: 8, step: 660, loss: 0.16788, accuracy: 0.95 [Train] epoch: 8, step: 661, loss: 0.03823, accuracy: 1.00 [Train] epoch: 8, step: 662, loss: 0.47958, accuracy: 0.80 [Train] epoch: 8, step: 663, loss: 0.61354, accuracy: 0.85 [Train] epoch: 8, step: 664, loss: 0.43793, accuracy: 0.85 [Train] epoch: 8, step: 665, loss: 0.05585, accuracy: 1.00 [Train] epoch: 8, step: 666, loss: 0.10387, accuracy: 1.00 [Train] epoch: 8, step: 667, loss: 0.20540, accuracy: 0.95 [Train] epoch: 8, step: 668, loss: 0.08822, accuracy: 1.00 [Train] epoch: 8, step: 669, loss: 0.47414, accuracy: 0.80 [Train] epoch: 8, step: 670, loss: 0.17349, accuracy: 0.95 [Train] epoch: 8, step: 671, loss: 0.37

[Train] epoch: 8, step: 962, loss: 0.12375, accuracy: 0.95 [Train] epoch: 8, step: 963, loss: 0.35189, accuracy: 0.75 [Train] epoch: 8, step: 964, loss: 0.27582, accuracy: 0.90 [Train] epoch: 8, step: 965, loss: 0.25620, accuracy: 0.90 [Train] epoch: 8, step: 966, loss: 0.47163, accuracy: 0.85 [Train] epoch: 8, step: 967, loss: 0.36861, accuracy: 0.95 [Train] epoch: 8, step: 968, loss: 0.20470, accuracy: 0.90 [Train] epoch: 8, step: 969, loss: 0.06888, accuracy: 0.95 [Train] epoch: 8, step: 970, loss: 0.30922, accuracy: 0.90 [Train] epoch: 8, step: 971, loss: 0.19780, accuracy: 0.90 [Train] epoch: 8, step: 972, loss: 0.30811, accuracy: 0.90 [Train] epoch: 8, step: 973, loss: 0.06163, accuracy: 1.00 [Train] epoch: 8, step: 974, loss: 0.07018, accuracy: 1.00 [Train] epoch: 8, step: 975, loss: 0.38267, accuracy: 0.90 [Train] epoch: 8, step: 976, loss: 0.26478, accuracy: 0.95 [Train] epoch: 8, step: 977, loss: 0.18234, accuracy: 0.95 [Train] epoch: 8, step: 978, loss: 0.21

[Train] epoch: 8, step: 1270, loss: 0.17889, accuracy: 0.90 [Train] epoch: 8, step: 1271, loss: 0.09690, accuracy: 0.95 [Train] epoch: 8, step: 1272, loss: 0.20418, accuracy: 0.95 [Train] epoch: 8, step: 1273, loss: 0.13590, accuracy: 0.95 [Train] epoch: 8, step: 1274, loss: 0.41315, accuracy: 0.90 [Train] epoch: 8, step: 1275, loss: 0.19210, accuracy: 0.90 [Train] epoch: 8, step: 1276, loss: 0.06616, accuracy: 1.00 [Train] epoch: 8, step: 1277, loss: 0.28311, accuracy: 0.90 [Train] epoch: 8, step: 1278, loss: 0.13753, accuracy: 0.95 [Train] epoch: 8, step: 1279, loss: 0.15790, accuracy: 0.90 [Train] epoch: 8, step: 1280, loss: 0.72597, accuracy: 0.85 [Train] epoch: 8, step: 1281, loss: 0.17868, accuracy: 0.95 [Train] epoch: 8, step: 1282, loss: 0.08337, accuracy: 1.00 [Train] epoch: 8, step: 1283, loss: 0.44408, accuracy: 0.85 [Train] epoch: 8, step: 1284, loss: 0.30903, accuracy: 0.90 [Train] epoch: 8, step: 1285, loss: 0.10649, accuracy: 0.95 [Train] epoch: 8, step:

[Train] epoch: 8, step: 1576, loss: 0.20548, accuracy: 0.95 [Train] epoch: 8, step: 1577, loss: 0.11552, accuracy: 0.95 [Train] epoch: 8, step: 1578, loss: 0.24494, accuracy: 0.90 [Train] epoch: 8, step: 1579, loss: 0.14167, accuracy: 0.85 [Train] epoch: 8, step: 1580, loss: 0.18913, accuracy: 0.95 [Train] epoch: 8, step: 1581, loss: 0.21957, accuracy: 0.85 [Train] epoch: 8, step: 1582, loss: 0.49380, accuracy: 0.85 [Train] epoch: 8, step: 1583, loss: 0.13113, accuracy: 0.95 [Train] epoch: 8, step: 1584, loss: 0.20033, accuracy: 0.85 [Train] epoch: 8, step: 1585, loss: 0.81850, accuracy: 0.85 [Train] epoch: 8, step: 1586, loss: 0.12278, accuracy: 0.95 [Train] epoch: 8, step: 1587, loss: 0.10710, accuracy: 0.95 [Train] epoch: 8, step: 1588, loss: 0.10356, accuracy: 1.00 [Train] epoch: 8, step: 1589, loss: 0.66110, accuracy: 0.80 [Train] epoch: 8, step: 1590, loss: 0.09149, accuracy: 0.95 [Train] epoch: 8, step: 1591, loss: 0.25617, accuracy: 0.85 [Train] epoch: 8, step:

[Train] epoch: 8, step: 1878, loss: 0.13145, accuracy: 0.90 [Train] epoch: 8, step: 1879, loss: 0.13140, accuracy: 0.95 [Train] epoch: 8, step: 1880, loss: 0.17676, accuracy: 0.95 [Train] epoch: 8, step: 1881, loss: 0.05798, accuracy: 1.00 [Train] epoch: 8, step: 1882, loss: 0.15355, accuracy: 0.95 [Train] epoch: 8, step: 1883, loss: 0.05621, accuracy: 1.00 [Train] epoch: 8, step: 1884, loss: 0.29022, accuracy: 0.90 [Train] epoch: 8, step: 1885, loss: 0.10333, accuracy: 0.90 [Train] epoch: 8, step: 1886, loss: 0.31906, accuracy: 0.95 [Train] epoch: 8, step: 1887, loss: 0.15293, accuracy: 0.95 [Train] epoch: 8, step: 1888, loss: 0.28753, accuracy: 0.90 [Train] epoch: 8, step: 1889, loss: 0.18409, accuracy: 0.85 [Train] epoch: 8, step: 1890, loss: 0.24874, accuracy: 0.90 [Train] epoch: 8, step: 1891, loss: 0.15806, accuracy: 0.90 [Train] epoch: 8, step: 1892, loss: 0.04472, accuracy: 1.00 [Train] epoch: 8, step: 1893, loss: 0.36665, accuracy: 0.90 [Train] epoch: 8, step:

[Train] epoch: 8, step: 2180, loss: 0.24168, accuracy: 0.80 [Train] epoch: 8, step: 2181, loss: 0.35589, accuracy: 0.85 [Train] epoch: 8, step: 2182, loss: 0.33006, accuracy: 0.90 [Train] epoch: 8, step: 2183, loss: 0.10253, accuracy: 0.95 [Train] epoch: 8, step: 2184, loss: 0.22523, accuracy: 0.95 [Train] epoch: 8, step: 2185, loss: 0.15037, accuracy: 0.95 [Train] epoch: 8, step: 2186, loss: 0.29511, accuracy: 0.85 [Train] epoch: 8, step: 2187, loss: 0.36645, accuracy: 0.85 [Train] epoch: 8, step: 2188, loss: 0.14766, accuracy: 0.95 [Train] epoch: 8, step: 2189, loss: 0.19851, accuracy: 0.95 [Train] epoch: 8, step: 2190, loss: 0.06843, accuracy: 0.95 [Train] epoch: 8, step: 2191, loss: 0.12990, accuracy: 0.90 [Train] epoch: 8, step: 2192, loss: 0.21889, accuracy: 0.90 [Train] epoch: 8, step: 2193, loss: 0.07002, accuracy: 1.00 [Train] epoch: 8, step: 2194, loss: 0.07815, accuracy: 0.95 [Train] epoch: 8, step: 2195, loss: 0.35507, accuracy: 0.90 [Train] epoch: 8, step:

[Train] epoch: 8, step: 2483, loss: 0.08068, accuracy: 1.00 [Train] epoch: 8, step: 2484, loss: 0.19663, accuracy: 0.90 [Train] epoch: 8, step: 2485, loss: 0.15696, accuracy: 0.90 [Train] epoch: 8, step: 2486, loss: 0.08543, accuracy: 1.00 [Train] epoch: 8, step: 2487, loss: 0.47932, accuracy: 0.85 [Train] epoch: 8, step: 2488, loss: 0.17460, accuracy: 0.85 [Train] epoch: 8, step: 2489, loss: 0.19688, accuracy: 0.90 [Train] epoch: 8, step: 2490, loss: 0.12534, accuracy: 1.00 [Train] epoch: 8, step: 2491, loss: 0.25771, accuracy: 0.95 [Train] epoch: 8, step: 2492, loss: 0.09648, accuracy: 0.95 [Train] epoch: 8, step: 2493, loss: 0.09012, accuracy: 1.00 [Train] epoch: 8, step: 2494, loss: 0.06151, accuracy: 1.00 [Train] epoch: 8, step: 2495, loss: 0.12920, accuracy: 0.95 [Train] epoch: 8, step: 2496, loss: 0.16389, accuracy: 0.95 [Train] epoch: 8, step: 2497, loss: 0.15469, accuracy: 0.90 [Train] epoch: 8, step: 2498, loss: 0.46205, accuracy: 0.75 [Train] epoch: 8, step:

[Train] epoch: 8, step: 2744, loss: 0.35829, accuracy: 0.85 [Train] epoch: 8, step: 2745, loss: 0.40678, accuracy: 0.90 [Train] epoch: 8, step: 2746, loss: 0.08469, accuracy: 0.95 [Train] epoch: 8, step: 2747, loss: 0.28434, accuracy: 0.90 [Train] epoch: 8, step: 2748, loss: 0.25170, accuracy: 0.90 [Train] epoch: 8, step: 2749, loss: 0.11399, accuracy: 0.90 [Train] epoch: 9, step: 0, loss: 0.15336, accuracy: 0.95 [Train] epoch: 9, step: 1, loss: 0.18745, accuracy: 0.95 [Train] epoch: 9, step: 2, loss: 0.42663, accuracy: 0.75 [Train] epoch: 9, step: 3, loss: 0.23043, accuracy: 0.90 [Train] epoch: 9, step: 4, loss: 0.22537, accuracy: 0.90 [Train] epoch: 9, step: 5, loss: 0.43272, accuracy: 0.85 [Train] epoch: 9, step: 6, loss: 0.37294, accuracy: 0.80 [Train] epoch: 9, step: 7, loss: 0.19938, accuracy: 0.95 [Train] epoch: 9, step: 8, loss: 0.42984, accuracy: 0.85 [Train] epoch: 9, step: 9, loss: 0.26999, accuracy: 0.95 [Train] epoch: 9, step: 10, loss: 0.25235, accuracy: 

[Train] epoch: 9, step: 280, loss: 0.10817, accuracy: 1.00 [Train] epoch: 9, step: 281, loss: 0.11088, accuracy: 1.00 [Train] epoch: 9, step: 282, loss: 0.23646, accuracy: 0.90 [Train] epoch: 9, step: 283, loss: 0.05369, accuracy: 1.00 [Train] epoch: 9, step: 284, loss: 0.09653, accuracy: 0.95 [Train] epoch: 9, step: 285, loss: 0.30982, accuracy: 0.85 [Train] epoch: 9, step: 286, loss: 0.18469, accuracy: 0.90 [Train] epoch: 9, step: 287, loss: 0.15442, accuracy: 0.95 [Train] epoch: 9, step: 288, loss: 0.20175, accuracy: 0.95 [Train] epoch: 9, step: 289, loss: 0.14805, accuracy: 0.95 [Train] epoch: 9, step: 290, loss: 0.17216, accuracy: 0.95 [Train] epoch: 9, step: 291, loss: 0.53883, accuracy: 0.80 [Train] epoch: 9, step: 292, loss: 0.04423, accuracy: 1.00 [Train] epoch: 9, step: 293, loss: 0.13982, accuracy: 0.95 [Train] epoch: 9, step: 294, loss: 0.18301, accuracy: 0.90 [Train] epoch: 9, step: 295, loss: 0.10415, accuracy: 0.95 [Train] epoch: 9, step: 296, loss: 0.35

[Train] epoch: 9, step: 561, loss: 0.18920, accuracy: 0.95 [Train] epoch: 9, step: 562, loss: 0.09464, accuracy: 1.00 [Train] epoch: 9, step: 563, loss: 0.47384, accuracy: 0.80 [Train] epoch: 9, step: 564, loss: 0.17357, accuracy: 0.95 [Train] epoch: 9, step: 565, loss: 0.35629, accuracy: 0.85 [Train] epoch: 9, step: 566, loss: 0.12704, accuracy: 0.95 [Train] epoch: 9, step: 567, loss: 0.01501, accuracy: 1.00 [Train] epoch: 9, step: 568, loss: 0.42331, accuracy: 0.75 [Train] epoch: 9, step: 569, loss: 0.10737, accuracy: 0.95 [Train] epoch: 9, step: 570, loss: 0.09170, accuracy: 0.95 [Train] epoch: 9, step: 571, loss: 0.57196, accuracy: 0.85 [Train] epoch: 9, step: 572, loss: 0.05426, accuracy: 0.95 [Train] epoch: 9, step: 573, loss: 0.26859, accuracy: 0.85 [Train] epoch: 9, step: 574, loss: 0.52189, accuracy: 0.85 [Train] epoch: 9, step: 575, loss: 0.23522, accuracy: 0.95 [Train] epoch: 9, step: 576, loss: 1.10607, accuracy: 0.75 [Train] epoch: 9, step: 577, loss: 0.23

[Train] epoch: 9, step: 854, loss: 0.30465, accuracy: 0.90 [Train] epoch: 9, step: 855, loss: 0.37124, accuracy: 0.85 [Train] epoch: 9, step: 856, loss: 0.31549, accuracy: 0.90 [Train] epoch: 9, step: 857, loss: 0.08149, accuracy: 1.00 [Train] epoch: 9, step: 858, loss: 0.28318, accuracy: 0.85 [Train] epoch: 9, step: 859, loss: 0.83784, accuracy: 0.85 [Train] epoch: 9, step: 860, loss: 0.08590, accuracy: 0.95 [Train] epoch: 9, step: 861, loss: 0.17750, accuracy: 0.85 [Train] epoch: 9, step: 862, loss: 0.18354, accuracy: 0.90 [Train] epoch: 9, step: 863, loss: 0.48608, accuracy: 0.90 [Train] epoch: 9, step: 864, loss: 0.25152, accuracy: 0.90 [Train] epoch: 9, step: 865, loss: 0.13041, accuracy: 0.95 [Train] epoch: 9, step: 866, loss: 0.04625, accuracy: 1.00 [Train] epoch: 9, step: 867, loss: 0.11036, accuracy: 0.95 [Train] epoch: 9, step: 868, loss: 0.26154, accuracy: 0.95 [Train] epoch: 9, step: 869, loss: 0.14344, accuracy: 1.00 [Train] epoch: 9, step: 870, loss: 0.16

[Train] epoch: 9, step: 1153, loss: 0.17102, accuracy: 0.95 [Train] epoch: 9, step: 1154, loss: 0.21100, accuracy: 0.95 [Train] epoch: 9, step: 1155, loss: 0.01633, accuracy: 1.00 [Train] epoch: 9, step: 1156, loss: 0.34591, accuracy: 0.85 [Train] epoch: 9, step: 1157, loss: 0.18198, accuracy: 0.95 [Train] epoch: 9, step: 1158, loss: 0.25908, accuracy: 0.85 [Train] epoch: 9, step: 1159, loss: 0.22536, accuracy: 0.90 [Train] epoch: 9, step: 1160, loss: 0.06943, accuracy: 1.00 [Train] epoch: 9, step: 1161, loss: 0.21547, accuracy: 0.85 [Train] epoch: 9, step: 1162, loss: 0.02122, accuracy: 1.00 [Train] epoch: 9, step: 1163, loss: 0.24010, accuracy: 0.95 [Train] epoch: 9, step: 1164, loss: 0.33856, accuracy: 0.90 [Train] epoch: 9, step: 1165, loss: 0.27691, accuracy: 0.90 [Train] epoch: 9, step: 1166, loss: 0.09223, accuracy: 0.95 [Train] epoch: 9, step: 1167, loss: 0.47376, accuracy: 0.90 [Train] epoch: 9, step: 1168, loss: 0.27291, accuracy: 0.85 [Train] epoch: 9, step:

[Train] epoch: 9, step: 1456, loss: 0.08497, accuracy: 1.00 [Train] epoch: 9, step: 1457, loss: 0.17656, accuracy: 0.90 [Train] epoch: 9, step: 1458, loss: 0.03217, accuracy: 1.00 [Train] epoch: 9, step: 1459, loss: 0.24280, accuracy: 0.85 [Train] epoch: 9, step: 1460, loss: 0.21667, accuracy: 0.85 [Train] epoch: 9, step: 1461, loss: 0.10923, accuracy: 0.95 [Train] epoch: 9, step: 1462, loss: 0.02920, accuracy: 1.00 [Train] epoch: 9, step: 1463, loss: 0.29845, accuracy: 0.85 [Train] epoch: 9, step: 1464, loss: 0.24930, accuracy: 0.90 [Train] epoch: 9, step: 1465, loss: 0.23752, accuracy: 0.80 [Train] epoch: 9, step: 1466, loss: 0.12809, accuracy: 0.95 [Train] epoch: 9, step: 1467, loss: 0.13336, accuracy: 0.90 [Train] epoch: 9, step: 1468, loss: 0.38731, accuracy: 0.85 [Train] epoch: 9, step: 1469, loss: 0.57899, accuracy: 0.80 [Train] epoch: 9, step: 1470, loss: 0.06764, accuracy: 1.00 [Train] epoch: 9, step: 1471, loss: 0.58481, accuracy: 0.90 [Train] epoch: 9, step:

[Train] epoch: 9, step: 1765, loss: 0.19730, accuracy: 0.95 [Train] epoch: 9, step: 1766, loss: 0.11041, accuracy: 1.00 [Train] epoch: 9, step: 1767, loss: 0.33522, accuracy: 0.90 [Train] epoch: 9, step: 1768, loss: 0.47594, accuracy: 0.80 [Train] epoch: 9, step: 1769, loss: 0.12510, accuracy: 0.95 [Train] epoch: 9, step: 1770, loss: 0.06196, accuracy: 1.00 [Train] epoch: 9, step: 1771, loss: 0.09510, accuracy: 1.00 [Train] epoch: 9, step: 1772, loss: 0.12539, accuracy: 0.95 [Train] epoch: 9, step: 1773, loss: 0.19504, accuracy: 0.90 [Train] epoch: 9, step: 1774, loss: 0.10145, accuracy: 0.95 [Train] epoch: 9, step: 1775, loss: 0.54025, accuracy: 0.90 [Train] epoch: 9, step: 1776, loss: 0.03713, accuracy: 1.00 [Train] epoch: 9, step: 1777, loss: 0.20795, accuracy: 0.90 [Train] epoch: 9, step: 1778, loss: 0.24609, accuracy: 0.90 [Train] epoch: 9, step: 1779, loss: 0.25700, accuracy: 0.90 [Train] epoch: 9, step: 1780, loss: 0.05405, accuracy: 1.00 [Train] epoch: 9, step:

[Train] epoch: 9, step: 2076, loss: 0.17043, accuracy: 0.90 [Train] epoch: 9, step: 2077, loss: 0.21524, accuracy: 0.90 [Train] epoch: 9, step: 2078, loss: 0.12012, accuracy: 0.95 [Train] epoch: 9, step: 2079, loss: 0.06212, accuracy: 1.00 [Train] epoch: 9, step: 2080, loss: 0.23416, accuracy: 0.90 [Train] epoch: 9, step: 2081, loss: 0.24786, accuracy: 0.90 [Train] epoch: 9, step: 2082, loss: 0.26977, accuracy: 0.90 [Train] epoch: 9, step: 2083, loss: 0.08135, accuracy: 1.00 [Train] epoch: 9, step: 2084, loss: 0.10721, accuracy: 0.95 [Train] epoch: 9, step: 2085, loss: 0.27539, accuracy: 0.95 [Train] epoch: 9, step: 2086, loss: 0.03001, accuracy: 1.00 [Train] epoch: 9, step: 2087, loss: 0.14149, accuracy: 0.95 [Train] epoch: 9, step: 2088, loss: 0.15999, accuracy: 0.95 [Train] epoch: 9, step: 2089, loss: 0.24141, accuracy: 0.90 [Train] epoch: 9, step: 2090, loss: 0.05683, accuracy: 1.00 [Train] epoch: 9, step: 2091, loss: 0.50794, accuracy: 0.85 [Train] epoch: 9, step:

[Train] epoch: 9, step: 2381, loss: 0.22199, accuracy: 0.95 [Train] epoch: 9, step: 2382, loss: 0.32666, accuracy: 0.90 [Train] epoch: 9, step: 2383, loss: 0.29511, accuracy: 0.85 [Train] epoch: 9, step: 2384, loss: 0.33314, accuracy: 0.85 [Train] epoch: 9, step: 2385, loss: 0.15609, accuracy: 0.95 [Train] epoch: 9, step: 2386, loss: 0.46801, accuracy: 0.75 [Train] epoch: 9, step: 2387, loss: 0.57326, accuracy: 0.85 [Train] epoch: 9, step: 2388, loss: 0.24417, accuracy: 0.90 [Train] epoch: 9, step: 2389, loss: 0.17600, accuracy: 0.90 [Train] epoch: 9, step: 2390, loss: 0.14761, accuracy: 0.95 [Train] epoch: 9, step: 2391, loss: 0.25891, accuracy: 0.85 [Train] epoch: 9, step: 2392, loss: 0.09925, accuracy: 1.00 [Train] epoch: 9, step: 2393, loss: 0.24671, accuracy: 0.95 [Train] epoch: 9, step: 2394, loss: 0.08128, accuracy: 1.00 [Train] epoch: 9, step: 2395, loss: 0.14171, accuracy: 0.95 [Train] epoch: 9, step: 2396, loss: 0.13542, accuracy: 0.95 [Train] epoch: 9, step:

[Train] epoch: 9, step: 2677, loss: 0.07844, accuracy: 1.00 [Train] epoch: 9, step: 2678, loss: 0.23935, accuracy: 0.85 [Train] epoch: 9, step: 2679, loss: 0.41654, accuracy: 0.90 [Train] epoch: 9, step: 2680, loss: 0.86355, accuracy: 0.85 [Train] epoch: 9, step: 2681, loss: 0.06774, accuracy: 0.95 [Train] epoch: 9, step: 2682, loss: 0.35412, accuracy: 0.85 [Train] epoch: 9, step: 2683, loss: 0.19661, accuracy: 0.90 [Train] epoch: 9, step: 2684, loss: 0.04362, accuracy: 1.00 [Train] epoch: 9, step: 2685, loss: 0.36215, accuracy: 0.90 [Train] epoch: 9, step: 2686, loss: 0.23248, accuracy: 0.95 [Train] epoch: 9, step: 2687, loss: 0.27862, accuracy: 0.90 [Train] epoch: 9, step: 2688, loss: 0.14212, accuracy: 0.95 [Train] epoch: 9, step: 2689, loss: 0.11942, accuracy: 0.95 [Train] epoch: 9, step: 2690, loss: 0.32322, accuracy: 0.90 [Train] epoch: 9, step: 2691, loss: 0.13157, accuracy: 0.90 [Train] epoch: 9, step: 2692, loss: 0.20966, accuracy: 0.95 [Train] epoch: 9, step: