In [1]:
import matplotlib as mpl
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import sklearn
import pandas as pd
import os
import sys
import time
import tensorflow as tf

from tensorflow import keras

print(tf.__version__)
print(sys.version_info)
for module in mpl,np,pd,sklearn,tf,keras:
    print(module.__name__,module.__version__)

tf.test.is_gpu_available()

  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])


1.13.1
sys.version_info(major=3, minor=7, micro=4, releaselevel='final', serial=0)
matplotlib 3.1.2
numpy 1.18.1
pandas 0.25.3
sklearn 0.22.1
tensorflow 1.13.1
tensorflow._api.v1.keras 2.2.4-tf


False

# Tf1.0
### Tf1.0实现全连接网络
```python
placeholder,session,feed_dict
1、placeholder, tf.layers.dense, tf.train.AdamOptimizer
2、tf.losses.sparse_softmax_cross_entropy
3、Tf.global_variables_initializer,feed_dict
```
### Dataset使用
```python
1、Dataset.make_one_shot_iterator
2、Dataset.make_initializable_iterator
```
### 自定义estimator
```python
1、Tf.feature_column.input_layer
2、Tf.estimator.EstimatorSpec
3、Tf.metrics.accuracy
```

In [2]:
fashion_mnist = keras.datasets.fashion_mnist
(x_train_all,y_train_all),(x_test, y_test) = fashion_mnist.load_data()
x_valid,x_train = x_train_all[:5000],x_train_all[5000:]
y_valid,y_train = y_train_all[:5000],y_train_all[5000:]

print(x_train.shape,y_train.shape)
print(x_valid.shape,y_valid.shape)
print(x_test.shape,y_test.shape)
print(np.max(x_train),np.min(x_train))

from sklearn.preprocessing import StandardScaler

scaler = StandardScaler()
# x_train:[None,28,28] -> [None,784]
x_train_scaled = scaler.fit_transform(
    x_train.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
x_valid_scaled = scaler.fit_transform(
    x_valid.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
x_test_scaled = scaler.fit_transform(
    x_test.astype(np.float32).reshape(-1,1)).reshape(-1,28*28)
print(np.max(x_train_scaled),np.min(x_train_scaled))

(55000, 28, 28) (55000,)
(5000, 28, 28) (5000,)
(10000, 28, 28) (10000,)
255 0
2.0231433 -0.8105136


In [3]:
# 构建模型
hidden_units = [100,100]
class_num = 10 # 10分类

x = tf.placeholder(tf.float32,[None,28 * 28])
y = tf.placeholder(tf.int64, [None])

input_for_next_layer = x
# 隐藏层
for hidden_unit in hidden_units:
    input_for_next_layer = tf.layers.dense(input_for_next_layer,
                                           hidden_unit,
                                           activation=tf.nn.relu)
# 输出层
logits = tf.layers.dense(input_for_next_layer,
                         class_num)

# loss计算
# 1. 将最后一层的输出做softmax计算出prob(每种分类的概率)
# 2. labels -> one_hot 将标签进行one-hot编码
# 3. 计算loss：就是去概率最大的那个max_prob进行-log(max_prob)的计算
loss = tf.losses.sparse_softmax_cross_entropy(labels = y,
                                              logits = logits)

# 计算正确率accuracy
# 取出概率最大的那个位置的索引位置作为预测
prediction = tf.argmax(logits, 1)
correct_prediction = tf.equal(prediction,y) # 正确的为1，错误的为0
# 先将int值转为float类型然后在进行正确率的计算
accuracy = tf.reduce_mean(tf.cast(correct_prediction,tf.float64)) 

# 定义train_op,在训练的时候就是调用train_op
train_op = tf.train.AdamOptimizer(1e-3).minimize(loss)

Instructions for updating:
Use keras.layers.dense instead.
Instructions for updating:
Colocations handled automatically by placer.
Instructions for updating:
Use tf.cast instead.


In [4]:
print(x)
print(logits)

Tensor("Placeholder:0", shape=(?, 784), dtype=float32)
Tensor("dense_2/BiasAdd:0", shape=(?, 10), dtype=float32)


In [6]:
# 模型训练
init = tf.global_variables_initializer()
batch_size = 32
epochs = 10
train_steps_per_epoch = x_train_scaled.shape[0] // batch_size
valid_steps = x_valid_scaled.shape[0] // batch_size

# 定义计算正确率的方法
def eval_with_sess(sess,x,y,accuracy,images,labels,batch_size):
    eval_steps = images.shape[0] // batch_size
    eval_accuracies = []
    for step in range(eval_steps):
        batch_data = images[step * batch_size : (step+1) * batch_size]
        batch_label = labels[step * batch_size : (step+1) * batch_size]
        accuracy_val = sess.run(accuracy,
                                feed_dict = {
                                    x:batch_data,
                                    y:batch_label
                                })
        eval_accuracies.append(accuracy_val)
    return np.mean(eval_accuracies)

with tf.Session() as sess:
    sess.run(init)
    for epoch in range(epochs):
        for step in range(train_steps_per_epoch):
            batch_data = x_train_scaled[step * batch_size : (step+1) * batch_size]
            batch_label = y_train[step * batch_size : (step+1) * batch_size]
            # 同时run多个op
            loss_val,accuracy_val,_ = sess.run(
                [loss,accuracy,train_op],
                feed_dict = { # 在此次训练时要填入的数据
                    x:batch_data,
                    y:batch_label
                })
            print('\r[Train] epoch: %d, step: %d, loss: %3.5f, accuracy: %2.2f' % 
                  (epoch,step,loss_val,accuracy_val),end="")
        valid_accuracy = eval_with_sess(sess,x,y,accuracy,
                                        x_valid_scaled,y_valid,
                                        batch_size= batch_size)
        print("\t[Valid] acc: %2.2f" % valid_accuracy)

[Train] epoch: 0, step: 0, loss: 2.88835, accuracy: 0.06[Train] epoch: 0, step: 1, loss: 2.33602, accuracy: 0.12[Train] epoch: 0, step: 2, loss: 2.18071, accuracy: 0.12[Train] epoch: 0, step: 3, loss: 1.87135, accuracy: 0.44[Train] epoch: 0, step: 4, loss: 1.80056, accuracy: 0.41[Train] epoch: 0, step: 5, loss: 1.56830, accuracy: 0.53[Train] epoch: 0, step: 6, loss: 1.65816, accuracy: 0.56[Train] epoch: 0, step: 7, loss: 1.81688, accuracy: 0.44[Train] epoch: 0, step: 8, loss: 1.76390, accuracy: 0.38[Train] epoch: 0, step: 9, loss: 1.30762, accuracy: 0.59[Train] epoch: 0, step: 10, loss: 1.10840, accuracy: 0.72[Train] epoch: 0, step: 11, loss: 1.30543, accuracy: 0.47[Train] epoch: 0, step: 12, loss: 1.30122, accuracy: 0.62[Train] epoch: 0, step: 13, loss: 1.22797, accuracy: 0.53[Train] epoch: 0, step: 14, loss: 0.99470, accuracy: 0.62[Train] epoch: 0, step: 15, loss: 1.24754, accuracy: 0.50[Train] epoch: 0, step: 16, loss: 0.82815, accuracy: 0.78[Train] epoch: 0, step:

[Train] epoch: 0, step: 270, loss: 0.51959, accuracy: 0.72[Train] epoch: 0, step: 271, loss: 0.43771, accuracy: 0.88[Train] epoch: 0, step: 272, loss: 0.42245, accuracy: 0.81[Train] epoch: 0, step: 273, loss: 0.38793, accuracy: 0.84[Train] epoch: 0, step: 274, loss: 0.59257, accuracy: 0.84[Train] epoch: 0, step: 275, loss: 0.26386, accuracy: 0.88[Train] epoch: 0, step: 276, loss: 0.46909, accuracy: 0.81[Train] epoch: 0, step: 277, loss: 0.62259, accuracy: 0.72[Train] epoch: 0, step: 278, loss: 0.48893, accuracy: 0.72[Train] epoch: 0, step: 279, loss: 0.79409, accuracy: 0.69[Train] epoch: 0, step: 280, loss: 0.48130, accuracy: 0.81[Train] epoch: 0, step: 281, loss: 0.43745, accuracy: 0.78[Train] epoch: 0, step: 282, loss: 0.72069, accuracy: 0.69[Train] epoch: 0, step: 283, loss: 0.52199, accuracy: 0.72[Train] epoch: 0, step: 284, loss: 0.57368, accuracy: 0.75[Train] epoch: 0, step: 285, loss: 0.41733, accuracy: 0.84[Train] epoch: 0, step: 286, loss: 0.70543, accuracy: 0

[Train] epoch: 0, step: 539, loss: 0.43097, accuracy: 0.88[Train] epoch: 0, step: 540, loss: 0.96407, accuracy: 0.69[Train] epoch: 0, step: 541, loss: 0.24739, accuracy: 0.91[Train] epoch: 0, step: 542, loss: 0.51826, accuracy: 0.78[Train] epoch: 0, step: 543, loss: 0.29248, accuracy: 0.84[Train] epoch: 0, step: 544, loss: 0.15214, accuracy: 0.97[Train] epoch: 0, step: 545, loss: 0.34112, accuracy: 0.84[Train] epoch: 0, step: 546, loss: 0.23560, accuracy: 0.94[Train] epoch: 0, step: 547, loss: 0.55717, accuracy: 0.84[Train] epoch: 0, step: 548, loss: 0.50139, accuracy: 0.78[Train] epoch: 0, step: 549, loss: 0.95186, accuracy: 0.84[Train] epoch: 0, step: 550, loss: 0.27049, accuracy: 0.88[Train] epoch: 0, step: 551, loss: 0.33388, accuracy: 0.88[Train] epoch: 0, step: 552, loss: 0.33665, accuracy: 0.84[Train] epoch: 0, step: 553, loss: 0.59359, accuracy: 0.81[Train] epoch: 0, step: 554, loss: 0.23029, accuracy: 0.91[Train] epoch: 0, step: 555, loss: 0.83443, accuracy: 0

[Train] epoch: 0, step: 817, loss: 0.27444, accuracy: 0.91[Train] epoch: 0, step: 818, loss: 0.32648, accuracy: 0.91[Train] epoch: 0, step: 819, loss: 0.70544, accuracy: 0.72[Train] epoch: 0, step: 820, loss: 0.71128, accuracy: 0.69[Train] epoch: 0, step: 821, loss: 0.39295, accuracy: 0.91[Train] epoch: 0, step: 822, loss: 0.51711, accuracy: 0.78[Train] epoch: 0, step: 823, loss: 0.33950, accuracy: 0.84[Train] epoch: 0, step: 824, loss: 0.17412, accuracy: 0.94[Train] epoch: 0, step: 825, loss: 0.24132, accuracy: 0.88[Train] epoch: 0, step: 826, loss: 0.67784, accuracy: 0.75[Train] epoch: 0, step: 827, loss: 0.27837, accuracy: 0.91[Train] epoch: 0, step: 828, loss: 0.45651, accuracy: 0.81[Train] epoch: 0, step: 829, loss: 0.45229, accuracy: 0.91[Train] epoch: 0, step: 830, loss: 0.27258, accuracy: 0.91[Train] epoch: 0, step: 831, loss: 0.36106, accuracy: 0.88[Train] epoch: 0, step: 832, loss: 0.54097, accuracy: 0.75[Train] epoch: 0, step: 833, loss: 0.52245, accuracy: 0

[Train] epoch: 0, step: 1099, loss: 0.54227, accuracy: 0.81[Train] epoch: 0, step: 1100, loss: 0.21458, accuracy: 0.91[Train] epoch: 0, step: 1101, loss: 0.30164, accuracy: 0.88[Train] epoch: 0, step: 1102, loss: 0.33715, accuracy: 0.91[Train] epoch: 0, step: 1103, loss: 0.18993, accuracy: 0.97[Train] epoch: 0, step: 1104, loss: 0.36074, accuracy: 0.81[Train] epoch: 0, step: 1105, loss: 0.57425, accuracy: 0.75[Train] epoch: 0, step: 1106, loss: 0.41947, accuracy: 0.84[Train] epoch: 0, step: 1107, loss: 0.23604, accuracy: 0.97[Train] epoch: 0, step: 1108, loss: 0.36408, accuracy: 0.88[Train] epoch: 0, step: 1109, loss: 0.58134, accuracy: 0.84[Train] epoch: 0, step: 1110, loss: 0.46943, accuracy: 0.91[Train] epoch: 0, step: 1111, loss: 0.38447, accuracy: 0.84[Train] epoch: 0, step: 1112, loss: 0.37016, accuracy: 0.88[Train] epoch: 0, step: 1113, loss: 0.55839, accuracy: 0.75[Train] epoch: 0, step: 1114, loss: 0.20582, accuracy: 0.97[Train] epoch: 0, step: 1115, loss: 0.3

[Train] epoch: 0, step: 1377, loss: 0.34253, accuracy: 0.81[Train] epoch: 0, step: 1378, loss: 0.26522, accuracy: 0.84[Train] epoch: 0, step: 1379, loss: 0.43151, accuracy: 0.91[Train] epoch: 0, step: 1380, loss: 0.31764, accuracy: 0.91[Train] epoch: 0, step: 1381, loss: 0.31364, accuracy: 0.88[Train] epoch: 0, step: 1382, loss: 0.38242, accuracy: 0.84[Train] epoch: 0, step: 1383, loss: 0.33264, accuracy: 0.91[Train] epoch: 0, step: 1384, loss: 0.37302, accuracy: 0.84[Train] epoch: 0, step: 1385, loss: 0.81406, accuracy: 0.78[Train] epoch: 0, step: 1386, loss: 0.37277, accuracy: 0.91[Train] epoch: 0, step: 1387, loss: 0.56118, accuracy: 0.75[Train] epoch: 0, step: 1388, loss: 0.46550, accuracy: 0.91[Train] epoch: 0, step: 1389, loss: 0.22948, accuracy: 0.91[Train] epoch: 0, step: 1390, loss: 0.47253, accuracy: 0.78[Train] epoch: 0, step: 1391, loss: 0.17742, accuracy: 0.94[Train] epoch: 0, step: 1392, loss: 0.54157, accuracy: 0.81[Train] epoch: 0, step: 1393, loss: 0.3

[Train] epoch: 0, step: 1652, loss: 0.52688, accuracy: 0.75[Train] epoch: 0, step: 1653, loss: 0.31172, accuracy: 0.91[Train] epoch: 0, step: 1654, loss: 0.26993, accuracy: 0.91[Train] epoch: 0, step: 1655, loss: 0.36428, accuracy: 0.91[Train] epoch: 0, step: 1656, loss: 0.43241, accuracy: 0.81[Train] epoch: 0, step: 1657, loss: 0.43729, accuracy: 0.84[Train] epoch: 0, step: 1658, loss: 0.43191, accuracy: 0.84[Train] epoch: 0, step: 1659, loss: 0.57851, accuracy: 0.78[Train] epoch: 0, step: 1660, loss: 0.29319, accuracy: 0.91[Train] epoch: 0, step: 1661, loss: 0.61954, accuracy: 0.81[Train] epoch: 0, step: 1662, loss: 0.36058, accuracy: 0.84[Train] epoch: 0, step: 1663, loss: 0.34477, accuracy: 0.91[Train] epoch: 0, step: 1664, loss: 0.26089, accuracy: 0.84[Train] epoch: 0, step: 1665, loss: 0.41295, accuracy: 0.81[Train] epoch: 0, step: 1666, loss: 0.55231, accuracy: 0.78[Train] epoch: 0, step: 1667, loss: 0.26472, accuracy: 0.88[Train] epoch: 0, step: 1668, loss: 0.3

[Train] epoch: 1, step: 0, loss: 0.27425, accuracy: 0.88[Train] epoch: 1, step: 1, loss: 0.66411, accuracy: 0.78[Train] epoch: 1, step: 2, loss: 0.39664, accuracy: 0.75[Train] epoch: 1, step: 3, loss: 0.42495, accuracy: 0.84[Train] epoch: 1, step: 4, loss: 0.51301, accuracy: 0.81[Train] epoch: 1, step: 5, loss: 0.58279, accuracy: 0.84[Train] epoch: 1, step: 6, loss: 0.35503, accuracy: 0.88[Train] epoch: 1, step: 7, loss: 0.76668, accuracy: 0.72[Train] epoch: 1, step: 8, loss: 0.56880, accuracy: 0.78[Train] epoch: 1, step: 9, loss: 0.36753, accuracy: 0.84[Train] epoch: 1, step: 10, loss: 0.58719, accuracy: 0.78[Train] epoch: 1, step: 11, loss: 0.64287, accuracy: 0.78[Train] epoch: 1, step: 12, loss: 0.50524, accuracy: 0.81[Train] epoch: 1, step: 13, loss: 0.53951, accuracy: 0.75[Train] epoch: 1, step: 14, loss: 0.28760, accuracy: 0.78[Train] epoch: 1, step: 15, loss: 0.52457, accuracy: 0.78[Train] epoch: 1, step: 16, loss: 0.28649, accuracy: 0.94[Train] epoch: 1, step:

[Train] epoch: 1, step: 380, loss: 0.24032, accuracy: 0.91[Train] epoch: 1, step: 381, loss: 0.51388, accuracy: 0.78[Train] epoch: 1, step: 382, loss: 0.85936, accuracy: 0.75[Train] epoch: 1, step: 383, loss: 0.33720, accuracy: 0.88[Train] epoch: 1, step: 384, loss: 0.51048, accuracy: 0.81[Train] epoch: 1, step: 385, loss: 0.54496, accuracy: 0.78[Train] epoch: 1, step: 386, loss: 0.45478, accuracy: 0.84[Train] epoch: 1, step: 387, loss: 0.27510, accuracy: 0.88[Train] epoch: 1, step: 388, loss: 0.51349, accuracy: 0.84[Train] epoch: 1, step: 389, loss: 0.38695, accuracy: 0.81[Train] epoch: 1, step: 390, loss: 0.21256, accuracy: 0.94[Train] epoch: 1, step: 391, loss: 0.66577, accuracy: 0.75[Train] epoch: 1, step: 392, loss: 0.38081, accuracy: 0.81[Train] epoch: 1, step: 393, loss: 0.29338, accuracy: 0.88[Train] epoch: 1, step: 394, loss: 0.35180, accuracy: 0.88[Train] epoch: 1, step: 395, loss: 0.86126, accuracy: 0.72[Train] epoch: 1, step: 396, loss: 0.52574, accuracy: 0

[Train] epoch: 1, step: 660, loss: 0.30242, accuracy: 0.94[Train] epoch: 1, step: 661, loss: 0.17905, accuracy: 0.94[Train] epoch: 1, step: 662, loss: 0.63072, accuracy: 0.75[Train] epoch: 1, step: 663, loss: 0.65501, accuracy: 0.84[Train] epoch: 1, step: 664, loss: 0.52916, accuracy: 0.75[Train] epoch: 1, step: 665, loss: 0.33156, accuracy: 0.81[Train] epoch: 1, step: 666, loss: 0.29006, accuracy: 0.84[Train] epoch: 1, step: 667, loss: 0.29714, accuracy: 0.88[Train] epoch: 1, step: 668, loss: 0.34323, accuracy: 0.91[Train] epoch: 1, step: 669, loss: 0.46313, accuracy: 0.81[Train] epoch: 1, step: 670, loss: 0.36154, accuracy: 0.88[Train] epoch: 1, step: 671, loss: 0.25518, accuracy: 0.91[Train] epoch: 1, step: 672, loss: 0.19899, accuracy: 0.88[Train] epoch: 1, step: 673, loss: 0.18940, accuracy: 0.94[Train] epoch: 1, step: 674, loss: 0.22598, accuracy: 0.88[Train] epoch: 1, step: 675, loss: 0.10853, accuracy: 0.97[Train] epoch: 1, step: 676, loss: 0.25605, accuracy: 0

[Train] epoch: 1, step: 937, loss: 0.26331, accuracy: 0.88[Train] epoch: 1, step: 938, loss: 0.28950, accuracy: 0.94[Train] epoch: 1, step: 939, loss: 0.26859, accuracy: 0.94[Train] epoch: 1, step: 940, loss: 0.34513, accuracy: 0.88[Train] epoch: 1, step: 941, loss: 0.37359, accuracy: 0.84[Train] epoch: 1, step: 942, loss: 0.31095, accuracy: 0.91[Train] epoch: 1, step: 943, loss: 0.35764, accuracy: 0.88[Train] epoch: 1, step: 944, loss: 0.32901, accuracy: 0.88[Train] epoch: 1, step: 945, loss: 0.30799, accuracy: 0.88[Train] epoch: 1, step: 946, loss: 0.49428, accuracy: 0.88[Train] epoch: 1, step: 947, loss: 0.41878, accuracy: 0.94[Train] epoch: 1, step: 948, loss: 0.41421, accuracy: 0.88[Train] epoch: 1, step: 949, loss: 0.17600, accuracy: 0.94[Train] epoch: 1, step: 950, loss: 0.17413, accuracy: 0.97[Train] epoch: 1, step: 951, loss: 0.37106, accuracy: 0.78[Train] epoch: 1, step: 952, loss: 0.35137, accuracy: 0.84[Train] epoch: 1, step: 953, loss: 0.38393, accuracy: 0

[Train] epoch: 1, step: 1216, loss: 0.31361, accuracy: 0.91[Train] epoch: 1, step: 1217, loss: 0.22673, accuracy: 0.94[Train] epoch: 1, step: 1218, loss: 0.45235, accuracy: 0.81[Train] epoch: 1, step: 1219, loss: 0.11451, accuracy: 0.97[Train] epoch: 1, step: 1220, loss: 0.15696, accuracy: 0.97[Train] epoch: 1, step: 1221, loss: 0.47804, accuracy: 0.84[Train] epoch: 1, step: 1222, loss: 0.50051, accuracy: 0.81[Train] epoch: 1, step: 1223, loss: 0.20354, accuracy: 0.91[Train] epoch: 1, step: 1224, loss: 0.19948, accuracy: 0.91[Train] epoch: 1, step: 1225, loss: 0.30341, accuracy: 0.94[Train] epoch: 1, step: 1226, loss: 0.59127, accuracy: 0.78[Train] epoch: 1, step: 1227, loss: 0.39577, accuracy: 0.88[Train] epoch: 1, step: 1228, loss: 0.13923, accuracy: 1.00[Train] epoch: 1, step: 1229, loss: 0.75926, accuracy: 0.75[Train] epoch: 1, step: 1230, loss: 0.39268, accuracy: 0.81[Train] epoch: 1, step: 1231, loss: 0.35438, accuracy: 0.88[Train] epoch: 1, step: 1232, loss: 0.3

[Train] epoch: 1, step: 1486, loss: 0.33614, accuracy: 0.88[Train] epoch: 1, step: 1487, loss: 0.30275, accuracy: 0.88[Train] epoch: 1, step: 1488, loss: 0.41230, accuracy: 0.81[Train] epoch: 1, step: 1489, loss: 0.34014, accuracy: 0.78[Train] epoch: 1, step: 1490, loss: 0.35769, accuracy: 0.84[Train] epoch: 1, step: 1491, loss: 0.37173, accuracy: 0.88[Train] epoch: 1, step: 1492, loss: 0.69989, accuracy: 0.81[Train] epoch: 1, step: 1493, loss: 0.42604, accuracy: 0.88[Train] epoch: 1, step: 1494, loss: 0.16391, accuracy: 0.94[Train] epoch: 1, step: 1495, loss: 0.42812, accuracy: 0.84[Train] epoch: 1, step: 1496, loss: 0.09674, accuracy: 1.00[Train] epoch: 1, step: 1497, loss: 0.34081, accuracy: 0.94[Train] epoch: 1, step: 1498, loss: 0.43563, accuracy: 0.91[Train] epoch: 1, step: 1499, loss: 0.36932, accuracy: 0.91[Train] epoch: 1, step: 1500, loss: 0.33490, accuracy: 0.88[Train] epoch: 1, step: 1501, loss: 0.20408, accuracy: 0.94[Train] epoch: 1, step: 1502, loss: 0.2

	[Valid] acc: 0.87


[Train] epoch: 2, step: 0, loss: 0.21752, accuracy: 0.91[Train] epoch: 2, step: 1, loss: 0.63094, accuracy: 0.84[Train] epoch: 2, step: 2, loss: 0.34448, accuracy: 0.81[Train] epoch: 2, step: 3, loss: 0.36766, accuracy: 0.84[Train] epoch: 2, step: 4, loss: 0.50604, accuracy: 0.84[Train] epoch: 2, step: 5, loss: 0.52000, accuracy: 0.81[Train] epoch: 2, step: 6, loss: 0.30207, accuracy: 0.91[Train] epoch: 2, step: 7, loss: 0.62042, accuracy: 0.81[Train] epoch: 2, step: 8, loss: 0.37335, accuracy: 0.81[Train] epoch: 2, step: 9, loss: 0.33629, accuracy: 0.88[Train] epoch: 2, step: 10, loss: 0.45141, accuracy: 0.84[Train] epoch: 2, step: 11, loss: 0.46384, accuracy: 0.84[Train] epoch: 2, step: 12, loss: 0.49384, accuracy: 0.84[Train] epoch: 2, step: 13, loss: 0.57029, accuracy: 0.72[Train] epoch: 2, step: 14, loss: 0.29338, accuracy: 0.88[Train] epoch: 2, step: 15, loss: 0.41149, accuracy: 0.88[Train] epoch: 2, step: 16, loss: 0.23139, accuracy: 0.94[Train] epoch: 2, step:

[Train] epoch: 2, step: 531, loss: 0.32841, accuracy: 0.88[Train] epoch: 2, step: 532, loss: 0.11796, accuracy: 0.94[Train] epoch: 2, step: 533, loss: 0.47640, accuracy: 0.88[Train] epoch: 2, step: 534, loss: 0.47828, accuracy: 0.84[Train] epoch: 2, step: 535, loss: 0.28172, accuracy: 0.91[Train] epoch: 2, step: 536, loss: 0.30648, accuracy: 0.88[Train] epoch: 2, step: 537, loss: 0.55060, accuracy: 0.81[Train] epoch: 2, step: 538, loss: 0.34172, accuracy: 0.88[Train] epoch: 2, step: 539, loss: 0.35279, accuracy: 0.91[Train] epoch: 2, step: 540, loss: 0.39731, accuracy: 0.84[Train] epoch: 2, step: 541, loss: 0.07215, accuracy: 1.00[Train] epoch: 2, step: 542, loss: 0.33896, accuracy: 0.91[Train] epoch: 2, step: 543, loss: 0.17865, accuracy: 0.94[Train] epoch: 2, step: 544, loss: 0.13590, accuracy: 0.94[Train] epoch: 2, step: 545, loss: 0.23612, accuracy: 0.91[Train] epoch: 2, step: 546, loss: 0.13778, accuracy: 0.97[Train] epoch: 2, step: 547, loss: 0.37404, accuracy: 0

[Train] epoch: 2, step: 807, loss: 0.49820, accuracy: 0.81[Train] epoch: 2, step: 808, loss: 0.28382, accuracy: 0.88[Train] epoch: 2, step: 809, loss: 0.48306, accuracy: 0.78[Train] epoch: 2, step: 810, loss: 0.29101, accuracy: 0.91[Train] epoch: 2, step: 811, loss: 0.34964, accuracy: 0.91[Train] epoch: 2, step: 812, loss: 0.46402, accuracy: 0.88[Train] epoch: 2, step: 813, loss: 0.24443, accuracy: 0.91[Train] epoch: 2, step: 814, loss: 0.17865, accuracy: 0.91[Train] epoch: 2, step: 815, loss: 0.15301, accuracy: 0.94[Train] epoch: 2, step: 816, loss: 0.57929, accuracy: 0.72[Train] epoch: 2, step: 817, loss: 0.20822, accuracy: 0.94[Train] epoch: 2, step: 818, loss: 0.26181, accuracy: 0.97[Train] epoch: 2, step: 819, loss: 0.47756, accuracy: 0.75[Train] epoch: 2, step: 820, loss: 0.57612, accuracy: 0.81[Train] epoch: 2, step: 821, loss: 0.26089, accuracy: 0.91[Train] epoch: 2, step: 822, loss: 0.50925, accuracy: 0.78[Train] epoch: 2, step: 823, loss: 0.26969, accuracy: 0

[Train] epoch: 2, step: 1085, loss: 0.42208, accuracy: 0.84[Train] epoch: 2, step: 1086, loss: 0.12502, accuracy: 0.97[Train] epoch: 2, step: 1087, loss: 0.11368, accuracy: 0.94[Train] epoch: 2, step: 1088, loss: 0.37707, accuracy: 0.88[Train] epoch: 2, step: 1089, loss: 0.36734, accuracy: 0.84[Train] epoch: 2, step: 1090, loss: 0.14738, accuracy: 0.97[Train] epoch: 2, step: 1091, loss: 0.46516, accuracy: 0.84[Train] epoch: 2, step: 1092, loss: 0.26514, accuracy: 0.91[Train] epoch: 2, step: 1093, loss: 0.48613, accuracy: 0.81[Train] epoch: 2, step: 1094, loss: 0.48709, accuracy: 0.84[Train] epoch: 2, step: 1095, loss: 0.47850, accuracy: 0.91[Train] epoch: 2, step: 1096, loss: 0.51207, accuracy: 0.81[Train] epoch: 2, step: 1097, loss: 0.58099, accuracy: 0.78[Train] epoch: 2, step: 1098, loss: 0.38984, accuracy: 0.84[Train] epoch: 2, step: 1099, loss: 0.38350, accuracy: 0.94[Train] epoch: 2, step: 1100, loss: 0.14741, accuracy: 0.91[Train] epoch: 2, step: 1101, loss: 0.2

[Train] epoch: 2, step: 1360, loss: 0.47073, accuracy: 0.88[Train] epoch: 2, step: 1361, loss: 0.28626, accuracy: 0.91[Train] epoch: 2, step: 1362, loss: 0.43522, accuracy: 0.84[Train] epoch: 2, step: 1363, loss: 0.31338, accuracy: 0.88[Train] epoch: 2, step: 1364, loss: 0.27485, accuracy: 0.94[Train] epoch: 2, step: 1365, loss: 0.37539, accuracy: 0.88[Train] epoch: 2, step: 1366, loss: 0.36375, accuracy: 0.88[Train] epoch: 2, step: 1367, loss: 0.46082, accuracy: 0.81[Train] epoch: 2, step: 1368, loss: 0.29558, accuracy: 0.88[Train] epoch: 2, step: 1369, loss: 0.15109, accuracy: 0.91[Train] epoch: 2, step: 1370, loss: 0.18766, accuracy: 0.94[Train] epoch: 2, step: 1371, loss: 0.12964, accuracy: 0.94[Train] epoch: 2, step: 1372, loss: 0.45517, accuracy: 0.81[Train] epoch: 2, step: 1373, loss: 0.25162, accuracy: 0.91[Train] epoch: 2, step: 1374, loss: 0.15342, accuracy: 0.97[Train] epoch: 2, step: 1375, loss: 0.35007, accuracy: 0.84[Train] epoch: 2, step: 1376, loss: 0.4

[Train] epoch: 2, step: 1630, loss: 0.38960, accuracy: 0.84[Train] epoch: 2, step: 1631, loss: 0.62119, accuracy: 0.78[Train] epoch: 2, step: 1632, loss: 0.04768, accuracy: 1.00[Train] epoch: 2, step: 1633, loss: 0.32947, accuracy: 0.88[Train] epoch: 2, step: 1634, loss: 0.38157, accuracy: 0.81[Train] epoch: 2, step: 1635, loss: 0.20424, accuracy: 0.94[Train] epoch: 2, step: 1636, loss: 0.19554, accuracy: 0.91[Train] epoch: 2, step: 1637, loss: 0.21658, accuracy: 0.97[Train] epoch: 2, step: 1638, loss: 0.20167, accuracy: 0.91[Train] epoch: 2, step: 1639, loss: 0.31251, accuracy: 0.91[Train] epoch: 2, step: 1640, loss: 0.26252, accuracy: 0.91[Train] epoch: 2, step: 1641, loss: 0.09617, accuracy: 0.97[Train] epoch: 2, step: 1642, loss: 0.25187, accuracy: 0.91[Train] epoch: 2, step: 1643, loss: 0.34958, accuracy: 0.88[Train] epoch: 2, step: 1644, loss: 0.32106, accuracy: 0.88[Train] epoch: 2, step: 1645, loss: 0.22370, accuracy: 0.91[Train] epoch: 2, step: 1646, loss: 0.2

[Train] epoch: 3, step: 0, loss: 0.18835, accuracy: 0.97[Train] epoch: 3, step: 1, loss: 0.60643, accuracy: 0.84[Train] epoch: 3, step: 2, loss: 0.27586, accuracy: 0.88[Train] epoch: 3, step: 3, loss: 0.40479, accuracy: 0.81[Train] epoch: 3, step: 4, loss: 0.47072, accuracy: 0.78[Train] epoch: 3, step: 5, loss: 0.43657, accuracy: 0.88[Train] epoch: 3, step: 6, loss: 0.22009, accuracy: 0.91[Train] epoch: 3, step: 7, loss: 0.54488, accuracy: 0.81[Train] epoch: 3, step: 8, loss: 0.31248, accuracy: 0.88[Train] epoch: 3, step: 9, loss: 0.26178, accuracy: 0.84[Train] epoch: 3, step: 10, loss: 0.42636, accuracy: 0.88[Train] epoch: 3, step: 11, loss: 0.45488, accuracy: 0.84[Train] epoch: 3, step: 12, loss: 0.35092, accuracy: 0.88[Train] epoch: 3, step: 13, loss: 0.51956, accuracy: 0.78[Train] epoch: 3, step: 14, loss: 0.23631, accuracy: 0.88[Train] epoch: 3, step: 15, loss: 0.28012, accuracy: 0.88[Train] epoch: 3, step: 16, loss: 0.19052, accuracy: 0.94[Train] epoch: 3, step:

[Train] epoch: 3, step: 405, loss: 0.26100, accuracy: 0.88[Train] epoch: 3, step: 406, loss: 0.48121, accuracy: 0.78[Train] epoch: 3, step: 407, loss: 0.20207, accuracy: 0.91[Train] epoch: 3, step: 408, loss: 0.38948, accuracy: 0.81[Train] epoch: 3, step: 409, loss: 0.38848, accuracy: 0.78[Train] epoch: 3, step: 410, loss: 0.27114, accuracy: 0.91[Train] epoch: 3, step: 411, loss: 0.36105, accuracy: 0.84[Train] epoch: 3, step: 412, loss: 0.48024, accuracy: 0.81[Train] epoch: 3, step: 413, loss: 0.19551, accuracy: 0.91[Train] epoch: 3, step: 414, loss: 0.64195, accuracy: 0.84[Train] epoch: 3, step: 415, loss: 0.36158, accuracy: 0.88[Train] epoch: 3, step: 416, loss: 0.27546, accuracy: 0.88[Train] epoch: 3, step: 417, loss: 0.17636, accuracy: 0.94[Train] epoch: 3, step: 418, loss: 0.57836, accuracy: 0.81[Train] epoch: 3, step: 419, loss: 0.38603, accuracy: 0.88[Train] epoch: 3, step: 420, loss: 0.39214, accuracy: 0.88[Train] epoch: 3, step: 421, loss: 0.26148, accuracy: 0

[Train] epoch: 3, step: 679, loss: 0.30058, accuracy: 0.91[Train] epoch: 3, step: 680, loss: 0.32439, accuracy: 0.88[Train] epoch: 3, step: 681, loss: 0.37173, accuracy: 0.88[Train] epoch: 3, step: 682, loss: 0.17568, accuracy: 0.91[Train] epoch: 3, step: 683, loss: 0.19510, accuracy: 0.94[Train] epoch: 3, step: 684, loss: 0.49330, accuracy: 0.88[Train] epoch: 3, step: 685, loss: 0.22913, accuracy: 0.91[Train] epoch: 3, step: 686, loss: 0.25816, accuracy: 0.94[Train] epoch: 3, step: 687, loss: 0.18150, accuracy: 0.88[Train] epoch: 3, step: 688, loss: 0.21207, accuracy: 0.97[Train] epoch: 3, step: 689, loss: 0.13164, accuracy: 0.97[Train] epoch: 3, step: 690, loss: 0.12646, accuracy: 0.97[Train] epoch: 3, step: 691, loss: 0.52285, accuracy: 0.78[Train] epoch: 3, step: 692, loss: 0.21202, accuracy: 0.94[Train] epoch: 3, step: 693, loss: 0.35386, accuracy: 0.88[Train] epoch: 3, step: 694, loss: 0.27849, accuracy: 0.88[Train] epoch: 3, step: 695, loss: 0.37548, accuracy: 0

[Train] epoch: 3, step: 955, loss: 0.38000, accuracy: 0.88[Train] epoch: 3, step: 956, loss: 0.15425, accuracy: 0.94[Train] epoch: 3, step: 957, loss: 0.48975, accuracy: 0.91[Train] epoch: 3, step: 958, loss: 0.28508, accuracy: 0.91[Train] epoch: 3, step: 959, loss: 0.33301, accuracy: 0.88[Train] epoch: 3, step: 960, loss: 0.23155, accuracy: 0.91[Train] epoch: 3, step: 961, loss: 0.35622, accuracy: 0.84[Train] epoch: 3, step: 962, loss: 0.38123, accuracy: 0.81[Train] epoch: 3, step: 963, loss: 0.34654, accuracy: 0.84[Train] epoch: 3, step: 964, loss: 0.24900, accuracy: 0.94[Train] epoch: 3, step: 965, loss: 0.30628, accuracy: 0.88[Train] epoch: 3, step: 966, loss: 0.17615, accuracy: 0.94[Train] epoch: 3, step: 967, loss: 0.15241, accuracy: 0.94[Train] epoch: 3, step: 968, loss: 0.30056, accuracy: 0.91[Train] epoch: 3, step: 969, loss: 0.32272, accuracy: 0.81[Train] epoch: 3, step: 970, loss: 0.54232, accuracy: 0.84[Train] epoch: 3, step: 971, loss: 0.46014, accuracy: 0

[Train] epoch: 3, step: 1229, loss: 0.52038, accuracy: 0.81[Train] epoch: 3, step: 1230, loss: 0.40217, accuracy: 0.81[Train] epoch: 3, step: 1231, loss: 0.24260, accuracy: 0.84[Train] epoch: 3, step: 1232, loss: 0.25305, accuracy: 0.91[Train] epoch: 3, step: 1233, loss: 0.10093, accuracy: 0.97[Train] epoch: 3, step: 1234, loss: 0.33543, accuracy: 0.81[Train] epoch: 3, step: 1235, loss: 0.31476, accuracy: 0.84[Train] epoch: 3, step: 1236, loss: 0.25970, accuracy: 0.91[Train] epoch: 3, step: 1237, loss: 0.18316, accuracy: 0.91[Train] epoch: 3, step: 1238, loss: 0.28955, accuracy: 0.91[Train] epoch: 3, step: 1239, loss: 0.22059, accuracy: 0.94[Train] epoch: 3, step: 1240, loss: 0.17637, accuracy: 0.91[Train] epoch: 3, step: 1241, loss: 0.40373, accuracy: 0.84[Train] epoch: 3, step: 1242, loss: 0.46093, accuracy: 0.81[Train] epoch: 3, step: 1243, loss: 0.37301, accuracy: 0.88[Train] epoch: 3, step: 1244, loss: 0.62119, accuracy: 0.75[Train] epoch: 3, step: 1245, loss: 0.1

[Train] epoch: 3, step: 1502, loss: 0.21796, accuracy: 0.91[Train] epoch: 3, step: 1503, loss: 0.35452, accuracy: 0.88[Train] epoch: 3, step: 1504, loss: 0.19518, accuracy: 0.97[Train] epoch: 3, step: 1505, loss: 0.37837, accuracy: 0.88[Train] epoch: 3, step: 1506, loss: 0.18867, accuracy: 0.91[Train] epoch: 3, step: 1507, loss: 0.35016, accuracy: 0.88[Train] epoch: 3, step: 1508, loss: 0.30711, accuracy: 0.91[Train] epoch: 3, step: 1509, loss: 0.78009, accuracy: 0.69[Train] epoch: 3, step: 1510, loss: 0.25198, accuracy: 0.88[Train] epoch: 3, step: 1511, loss: 0.25691, accuracy: 0.88[Train] epoch: 3, step: 1512, loss: 0.29539, accuracy: 0.84[Train] epoch: 3, step: 1513, loss: 0.13262, accuracy: 0.97[Train] epoch: 3, step: 1514, loss: 0.29205, accuracy: 0.91[Train] epoch: 3, step: 1515, loss: 0.35091, accuracy: 0.84[Train] epoch: 3, step: 1516, loss: 0.20629, accuracy: 0.94[Train] epoch: 3, step: 1517, loss: 0.43127, accuracy: 0.88[Train] epoch: 3, step: 1518, loss: 0.3

	[Valid] acc: 0.87


[Train] epoch: 4, step: 0, loss: 0.12431, accuracy: 0.97[Train] epoch: 4, step: 1, loss: 0.57300, accuracy: 0.81[Train] epoch: 4, step: 2, loss: 0.29044, accuracy: 0.88[Train] epoch: 4, step: 3, loss: 0.38900, accuracy: 0.81[Train] epoch: 4, step: 4, loss: 0.35790, accuracy: 0.84[Train] epoch: 4, step: 5, loss: 0.40482, accuracy: 0.81[Train] epoch: 4, step: 6, loss: 0.21536, accuracy: 0.94[Train] epoch: 4, step: 7, loss: 0.58436, accuracy: 0.81[Train] epoch: 4, step: 8, loss: 0.28131, accuracy: 0.88[Train] epoch: 4, step: 9, loss: 0.22414, accuracy: 0.91[Train] epoch: 4, step: 10, loss: 0.43016, accuracy: 0.84[Train] epoch: 4, step: 11, loss: 0.24212, accuracy: 0.94[Train] epoch: 4, step: 12, loss: 0.29020, accuracy: 0.91[Train] epoch: 4, step: 13, loss: 0.50152, accuracy: 0.78[Train] epoch: 4, step: 14, loss: 0.25972, accuracy: 0.84[Train] epoch: 4, step: 15, loss: 0.26033, accuracy: 0.88[Train] epoch: 4, step: 16, loss: 0.17291, accuracy: 0.94[Train] epoch: 4, step:

[Train] epoch: 4, step: 552, loss: 0.10847, accuracy: 0.97[Train] epoch: 4, step: 553, loss: 0.31765, accuracy: 0.91[Train] epoch: 4, step: 554, loss: 0.24122, accuracy: 0.94[Train] epoch: 4, step: 555, loss: 0.46353, accuracy: 0.81[Train] epoch: 4, step: 556, loss: 0.25287, accuracy: 0.94[Train] epoch: 4, step: 557, loss: 0.16524, accuracy: 0.94[Train] epoch: 4, step: 558, loss: 0.33118, accuracy: 0.91[Train] epoch: 4, step: 559, loss: 0.24720, accuracy: 0.91[Train] epoch: 4, step: 560, loss: 0.37984, accuracy: 0.88[Train] epoch: 4, step: 561, loss: 0.50074, accuracy: 0.81[Train] epoch: 4, step: 562, loss: 0.24830, accuracy: 0.91[Train] epoch: 4, step: 563, loss: 0.41190, accuracy: 0.84[Train] epoch: 4, step: 564, loss: 0.23403, accuracy: 0.94[Train] epoch: 4, step: 565, loss: 0.20297, accuracy: 0.91[Train] epoch: 4, step: 566, loss: 0.24554, accuracy: 0.88[Train] epoch: 4, step: 567, loss: 0.30332, accuracy: 0.88[Train] epoch: 4, step: 568, loss: 0.40377, accuracy: 0

[Train] epoch: 4, step: 825, loss: 0.20714, accuracy: 0.91[Train] epoch: 4, step: 826, loss: 0.53059, accuracy: 0.84[Train] epoch: 4, step: 827, loss: 0.11579, accuracy: 0.97[Train] epoch: 4, step: 828, loss: 0.28816, accuracy: 0.91[Train] epoch: 4, step: 829, loss: 0.29031, accuracy: 0.88[Train] epoch: 4, step: 830, loss: 0.08899, accuracy: 0.97[Train] epoch: 4, step: 831, loss: 0.19820, accuracy: 0.91[Train] epoch: 4, step: 832, loss: 0.29585, accuracy: 0.88[Train] epoch: 4, step: 833, loss: 0.30042, accuracy: 0.88[Train] epoch: 4, step: 834, loss: 0.54553, accuracy: 0.81[Train] epoch: 4, step: 835, loss: 0.12780, accuracy: 0.97[Train] epoch: 4, step: 836, loss: 0.42628, accuracy: 0.84[Train] epoch: 4, step: 837, loss: 0.10306, accuracy: 0.94[Train] epoch: 4, step: 838, loss: 0.15340, accuracy: 0.97[Train] epoch: 4, step: 839, loss: 0.25329, accuracy: 0.91[Train] epoch: 4, step: 840, loss: 0.14094, accuracy: 0.94[Train] epoch: 4, step: 841, loss: 0.14533, accuracy: 0

[Train] epoch: 4, step: 1100, loss: 0.18440, accuracy: 0.91[Train] epoch: 4, step: 1101, loss: 0.26374, accuracy: 0.88[Train] epoch: 4, step: 1102, loss: 0.23794, accuracy: 0.94[Train] epoch: 4, step: 1103, loss: 0.18682, accuracy: 0.94[Train] epoch: 4, step: 1104, loss: 0.19848, accuracy: 0.97[Train] epoch: 4, step: 1105, loss: 0.40522, accuracy: 0.84[Train] epoch: 4, step: 1106, loss: 0.31922, accuracy: 0.84[Train] epoch: 4, step: 1107, loss: 0.13709, accuracy: 0.97[Train] epoch: 4, step: 1108, loss: 0.21623, accuracy: 0.91[Train] epoch: 4, step: 1109, loss: 0.32489, accuracy: 0.91[Train] epoch: 4, step: 1110, loss: 0.23788, accuracy: 0.91[Train] epoch: 4, step: 1111, loss: 0.25179, accuracy: 0.88[Train] epoch: 4, step: 1112, loss: 0.25900, accuracy: 0.91[Train] epoch: 4, step: 1113, loss: 0.46060, accuracy: 0.84[Train] epoch: 4, step: 1114, loss: 0.05950, accuracy: 1.00[Train] epoch: 4, step: 1115, loss: 0.33908, accuracy: 0.88[Train] epoch: 4, step: 1116, loss: 0.0

[Train] epoch: 4, step: 1377, loss: 0.31244, accuracy: 0.88[Train] epoch: 4, step: 1378, loss: 0.12127, accuracy: 0.97[Train] epoch: 4, step: 1379, loss: 0.19360, accuracy: 0.94[Train] epoch: 4, step: 1380, loss: 0.24453, accuracy: 0.91[Train] epoch: 4, step: 1381, loss: 0.11085, accuracy: 0.97[Train] epoch: 4, step: 1382, loss: 0.25311, accuracy: 0.88[Train] epoch: 4, step: 1383, loss: 0.19247, accuracy: 0.91[Train] epoch: 4, step: 1384, loss: 0.18596, accuracy: 0.94[Train] epoch: 4, step: 1385, loss: 0.41097, accuracy: 0.84[Train] epoch: 4, step: 1386, loss: 0.24119, accuracy: 0.91[Train] epoch: 4, step: 1387, loss: 0.42602, accuracy: 0.78[Train] epoch: 4, step: 1388, loss: 0.46073, accuracy: 0.88[Train] epoch: 4, step: 1389, loss: 0.18689, accuracy: 0.94[Train] epoch: 4, step: 1390, loss: 0.41018, accuracy: 0.81[Train] epoch: 4, step: 1391, loss: 0.09081, accuracy: 0.97[Train] epoch: 4, step: 1392, loss: 0.40150, accuracy: 0.84[Train] epoch: 4, step: 1393, loss: 0.2

[Train] epoch: 4, step: 1655, loss: 0.25954, accuracy: 0.91[Train] epoch: 4, step: 1656, loss: 0.32305, accuracy: 0.84[Train] epoch: 4, step: 1657, loss: 0.30894, accuracy: 0.91[Train] epoch: 4, step: 1658, loss: 0.35373, accuracy: 0.88[Train] epoch: 4, step: 1659, loss: 0.39549, accuracy: 0.81[Train] epoch: 4, step: 1660, loss: 0.14990, accuracy: 0.94[Train] epoch: 4, step: 1661, loss: 0.32422, accuracy: 0.84[Train] epoch: 4, step: 1662, loss: 0.29656, accuracy: 0.88[Train] epoch: 4, step: 1663, loss: 0.13430, accuracy: 0.97[Train] epoch: 4, step: 1664, loss: 0.20758, accuracy: 0.94[Train] epoch: 4, step: 1665, loss: 0.20505, accuracy: 0.91[Train] epoch: 4, step: 1666, loss: 0.45531, accuracy: 0.81[Train] epoch: 4, step: 1667, loss: 0.15337, accuracy: 0.91[Train] epoch: 4, step: 1668, loss: 0.24703, accuracy: 0.91[Train] epoch: 4, step: 1669, loss: 0.28778, accuracy: 0.88[Train] epoch: 4, step: 1670, loss: 0.34207, accuracy: 0.91[Train] epoch: 4, step: 1671, loss: 0.2

[Train] epoch: 5, step: 0, loss: 0.16054, accuracy: 0.97[Train] epoch: 5, step: 1, loss: 0.57058, accuracy: 0.81[Train] epoch: 5, step: 2, loss: 0.31986, accuracy: 0.88[Train] epoch: 5, step: 3, loss: 0.34065, accuracy: 0.84[Train] epoch: 5, step: 4, loss: 0.40360, accuracy: 0.81[Train] epoch: 5, step: 5, loss: 0.53517, accuracy: 0.78[Train] epoch: 5, step: 6, loss: 0.21012, accuracy: 0.94[Train] epoch: 5, step: 7, loss: 0.40804, accuracy: 0.88[Train] epoch: 5, step: 8, loss: 0.23287, accuracy: 0.94[Train] epoch: 5, step: 9, loss: 0.18708, accuracy: 0.94[Train] epoch: 5, step: 10, loss: 0.31124, accuracy: 0.91[Train] epoch: 5, step: 11, loss: 0.39816, accuracy: 0.81[Train] epoch: 5, step: 12, loss: 0.30272, accuracy: 0.88[Train] epoch: 5, step: 13, loss: 0.47955, accuracy: 0.78[Train] epoch: 5, step: 14, loss: 0.24600, accuracy: 0.84[Train] epoch: 5, step: 15, loss: 0.26716, accuracy: 0.88[Train] epoch: 5, step: 16, loss: 0.17469, accuracy: 0.97[Train] epoch: 5, step:

[Train] epoch: 5, step: 426, loss: 0.05467, accuracy: 1.00[Train] epoch: 5, step: 427, loss: 0.30213, accuracy: 0.84[Train] epoch: 5, step: 428, loss: 0.12401, accuracy: 0.97[Train] epoch: 5, step: 429, loss: 0.16779, accuracy: 0.94[Train] epoch: 5, step: 430, loss: 0.15262, accuracy: 0.97[Train] epoch: 5, step: 431, loss: 0.16595, accuracy: 0.94[Train] epoch: 5, step: 432, loss: 0.36249, accuracy: 0.81[Train] epoch: 5, step: 433, loss: 0.35918, accuracy: 0.84[Train] epoch: 5, step: 434, loss: 0.18411, accuracy: 0.94[Train] epoch: 5, step: 435, loss: 0.33640, accuracy: 0.84[Train] epoch: 5, step: 436, loss: 0.11034, accuracy: 1.00[Train] epoch: 5, step: 437, loss: 0.42452, accuracy: 0.88[Train] epoch: 5, step: 438, loss: 0.34459, accuracy: 0.81[Train] epoch: 5, step: 439, loss: 0.39445, accuracy: 0.81[Train] epoch: 5, step: 440, loss: 0.44097, accuracy: 0.88[Train] epoch: 5, step: 441, loss: 0.37155, accuracy: 0.78[Train] epoch: 5, step: 442, loss: 0.18507, accuracy: 0

[Train] epoch: 5, step: 697, loss: 0.16849, accuracy: 0.94[Train] epoch: 5, step: 698, loss: 0.53457, accuracy: 0.91[Train] epoch: 5, step: 699, loss: 0.15517, accuracy: 0.94[Train] epoch: 5, step: 700, loss: 0.16323, accuracy: 0.94[Train] epoch: 5, step: 701, loss: 0.22173, accuracy: 0.91[Train] epoch: 5, step: 702, loss: 0.08952, accuracy: 0.97[Train] epoch: 5, step: 703, loss: 0.22809, accuracy: 0.88[Train] epoch: 5, step: 704, loss: 0.31493, accuracy: 0.81[Train] epoch: 5, step: 705, loss: 0.29306, accuracy: 0.91[Train] epoch: 5, step: 706, loss: 0.45994, accuracy: 0.84[Train] epoch: 5, step: 707, loss: 0.29304, accuracy: 0.91[Train] epoch: 5, step: 708, loss: 0.37833, accuracy: 0.84[Train] epoch: 5, step: 709, loss: 0.24163, accuracy: 0.91[Train] epoch: 5, step: 710, loss: 0.25277, accuracy: 0.88[Train] epoch: 5, step: 711, loss: 0.27937, accuracy: 0.91[Train] epoch: 5, step: 712, loss: 0.33761, accuracy: 0.84[Train] epoch: 5, step: 713, loss: 0.09904, accuracy: 0

[Train] epoch: 5, step: 972, loss: 0.15860, accuracy: 0.94[Train] epoch: 5, step: 973, loss: 0.24459, accuracy: 0.88[Train] epoch: 5, step: 974, loss: 0.17507, accuracy: 0.91[Train] epoch: 5, step: 975, loss: 0.17361, accuracy: 0.88[Train] epoch: 5, step: 976, loss: 0.32770, accuracy: 0.81[Train] epoch: 5, step: 977, loss: 0.35578, accuracy: 0.91[Train] epoch: 5, step: 978, loss: 0.58887, accuracy: 0.81[Train] epoch: 5, step: 979, loss: 0.10872, accuracy: 0.97[Train] epoch: 5, step: 980, loss: 0.20384, accuracy: 0.94[Train] epoch: 5, step: 981, loss: 0.29087, accuracy: 0.88[Train] epoch: 5, step: 982, loss: 0.49990, accuracy: 0.81[Train] epoch: 5, step: 983, loss: 0.41249, accuracy: 0.81[Train] epoch: 5, step: 984, loss: 0.44967, accuracy: 0.84[Train] epoch: 5, step: 985, loss: 0.29182, accuracy: 0.88[Train] epoch: 5, step: 986, loss: 0.21195, accuracy: 0.91[Train] epoch: 5, step: 987, loss: 0.18146, accuracy: 0.88[Train] epoch: 5, step: 988, loss: 0.34350, accuracy: 0

[Train] epoch: 5, step: 1244, loss: 0.46824, accuracy: 0.78[Train] epoch: 5, step: 1245, loss: 0.18801, accuracy: 0.91[Train] epoch: 5, step: 1246, loss: 0.37006, accuracy: 0.94[Train] epoch: 5, step: 1247, loss: 0.43441, accuracy: 0.81[Train] epoch: 5, step: 1248, loss: 0.29448, accuracy: 0.84[Train] epoch: 5, step: 1249, loss: 0.10631, accuracy: 0.94[Train] epoch: 5, step: 1250, loss: 0.24117, accuracy: 0.91[Train] epoch: 5, step: 1251, loss: 0.25220, accuracy: 0.88[Train] epoch: 5, step: 1252, loss: 0.30461, accuracy: 0.84[Train] epoch: 5, step: 1253, loss: 0.25403, accuracy: 0.88[Train] epoch: 5, step: 1254, loss: 0.21385, accuracy: 0.94[Train] epoch: 5, step: 1255, loss: 0.24909, accuracy: 0.91[Train] epoch: 5, step: 1256, loss: 0.46759, accuracy: 0.81[Train] epoch: 5, step: 1257, loss: 0.20826, accuracy: 0.91[Train] epoch: 5, step: 1258, loss: 0.31924, accuracy: 0.88[Train] epoch: 5, step: 1259, loss: 0.17165, accuracy: 0.97[Train] epoch: 5, step: 1260, loss: 0.2

[Train] epoch: 5, step: 1519, loss: 0.16260, accuracy: 0.94[Train] epoch: 5, step: 1520, loss: 0.32578, accuracy: 0.88[Train] epoch: 5, step: 1521, loss: 0.33597, accuracy: 0.88[Train] epoch: 5, step: 1522, loss: 0.13196, accuracy: 0.94[Train] epoch: 5, step: 1523, loss: 0.34254, accuracy: 0.91[Train] epoch: 5, step: 1524, loss: 0.14818, accuracy: 0.97[Train] epoch: 5, step: 1525, loss: 0.20743, accuracy: 0.91[Train] epoch: 5, step: 1526, loss: 0.17268, accuracy: 0.91[Train] epoch: 5, step: 1527, loss: 0.63723, accuracy: 0.81[Train] epoch: 5, step: 1528, loss: 0.28432, accuracy: 0.88[Train] epoch: 5, step: 1529, loss: 0.11478, accuracy: 1.00[Train] epoch: 5, step: 1530, loss: 0.27042, accuracy: 0.88[Train] epoch: 5, step: 1531, loss: 0.12752, accuracy: 0.94[Train] epoch: 5, step: 1532, loss: 0.32770, accuracy: 0.88[Train] epoch: 5, step: 1533, loss: 0.40982, accuracy: 0.81[Train] epoch: 5, step: 1534, loss: 0.27320, accuracy: 0.84[Train] epoch: 5, step: 1535, loss: 0.2

[Train] epoch: 6, step: 0, loss: 0.10202, accuracy: 1.00[Train] epoch: 6, step: 1, loss: 0.45399, accuracy: 0.88[Train] epoch: 6, step: 2, loss: 0.35253, accuracy: 0.91[Train] epoch: 6, step: 3, loss: 0.45064, accuracy: 0.78[Train] epoch: 6, step: 4, loss: 0.34717, accuracy: 0.88[Train] epoch: 6, step: 5, loss: 0.41305, accuracy: 0.81[Train] epoch: 6, step: 6, loss: 0.19779, accuracy: 0.91[Train] epoch: 6, step: 7, loss: 0.37678, accuracy: 0.84[Train] epoch: 6, step: 8, loss: 0.19868, accuracy: 0.94[Train] epoch: 6, step: 9, loss: 0.18150, accuracy: 0.97[Train] epoch: 6, step: 10, loss: 0.30033, accuracy: 0.88[Train] epoch: 6, step: 11, loss: 0.36187, accuracy: 0.78[Train] epoch: 6, step: 12, loss: 0.28839, accuracy: 0.91[Train] epoch: 6, step: 13, loss: 0.44589, accuracy: 0.84[Train] epoch: 6, step: 14, loss: 0.21314, accuracy: 0.88[Train] epoch: 6, step: 15, loss: 0.25794, accuracy: 0.91[Train] epoch: 6, step: 16, loss: 0.16183, accuracy: 0.94[Train] epoch: 6, step:

[Train] epoch: 6, step: 289, loss: 0.29045, accuracy: 0.81[Train] epoch: 6, step: 290, loss: 0.13819, accuracy: 0.94[Train] epoch: 6, step: 291, loss: 0.57362, accuracy: 0.72[Train] epoch: 6, step: 292, loss: 0.15166, accuracy: 0.94[Train] epoch: 6, step: 293, loss: 0.12060, accuracy: 0.97[Train] epoch: 6, step: 294, loss: 0.36576, accuracy: 0.88[Train] epoch: 6, step: 295, loss: 0.29266, accuracy: 0.94[Train] epoch: 6, step: 296, loss: 0.43372, accuracy: 0.84[Train] epoch: 6, step: 297, loss: 0.14397, accuracy: 1.00[Train] epoch: 6, step: 298, loss: 0.21336, accuracy: 0.94[Train] epoch: 6, step: 299, loss: 0.16404, accuracy: 0.91[Train] epoch: 6, step: 300, loss: 0.29119, accuracy: 0.91[Train] epoch: 6, step: 301, loss: 0.31490, accuracy: 0.88[Train] epoch: 6, step: 302, loss: 0.43491, accuracy: 0.81[Train] epoch: 6, step: 303, loss: 0.18394, accuracy: 0.91[Train] epoch: 6, step: 304, loss: 0.21619, accuracy: 0.91[Train] epoch: 6, step: 305, loss: 0.18287, accuracy: 0

[Train] epoch: 6, step: 568, loss: 0.35569, accuracy: 0.84[Train] epoch: 6, step: 569, loss: 0.30315, accuracy: 0.88[Train] epoch: 6, step: 570, loss: 0.19416, accuracy: 0.97[Train] epoch: 6, step: 571, loss: 0.15036, accuracy: 0.97[Train] epoch: 6, step: 572, loss: 0.19313, accuracy: 0.97[Train] epoch: 6, step: 573, loss: 0.40557, accuracy: 0.88[Train] epoch: 6, step: 574, loss: 0.12810, accuracy: 0.94[Train] epoch: 6, step: 575, loss: 0.13887, accuracy: 0.97[Train] epoch: 6, step: 576, loss: 0.23766, accuracy: 0.94[Train] epoch: 6, step: 577, loss: 0.35404, accuracy: 0.91[Train] epoch: 6, step: 578, loss: 0.13538, accuracy: 0.97[Train] epoch: 6, step: 579, loss: 0.22000, accuracy: 0.88[Train] epoch: 6, step: 580, loss: 0.35881, accuracy: 0.88[Train] epoch: 6, step: 581, loss: 0.25623, accuracy: 0.88[Train] epoch: 6, step: 582, loss: 0.16177, accuracy: 0.97[Train] epoch: 6, step: 583, loss: 0.19095, accuracy: 0.88[Train] epoch: 6, step: 584, loss: 0.20947, accuracy: 0

[Train] epoch: 6, step: 846, loss: 0.39431, accuracy: 0.81[Train] epoch: 6, step: 847, loss: 0.13242, accuracy: 0.97[Train] epoch: 6, step: 848, loss: 0.17038, accuracy: 0.91[Train] epoch: 6, step: 849, loss: 0.13099, accuracy: 0.97[Train] epoch: 6, step: 850, loss: 0.26298, accuracy: 0.81[Train] epoch: 6, step: 851, loss: 0.38020, accuracy: 0.88[Train] epoch: 6, step: 852, loss: 0.22530, accuracy: 0.84[Train] epoch: 6, step: 853, loss: 0.35499, accuracy: 0.88[Train] epoch: 6, step: 854, loss: 0.11865, accuracy: 0.97[Train] epoch: 6, step: 855, loss: 0.26016, accuracy: 0.88[Train] epoch: 6, step: 856, loss: 0.38036, accuracy: 0.91[Train] epoch: 6, step: 857, loss: 0.20107, accuracy: 0.91[Train] epoch: 6, step: 858, loss: 0.16745, accuracy: 0.91[Train] epoch: 6, step: 859, loss: 0.17355, accuracy: 0.94[Train] epoch: 6, step: 860, loss: 0.03590, accuracy: 1.00[Train] epoch: 6, step: 861, loss: 0.14880, accuracy: 0.94[Train] epoch: 6, step: 862, loss: 0.16038, accuracy: 0

[Train] epoch: 6, step: 1120, loss: 0.28916, accuracy: 0.94[Train] epoch: 6, step: 1121, loss: 0.28553, accuracy: 0.88[Train] epoch: 6, step: 1122, loss: 0.10326, accuracy: 0.97[Train] epoch: 6, step: 1123, loss: 0.23882, accuracy: 0.94[Train] epoch: 6, step: 1124, loss: 0.11920, accuracy: 0.94[Train] epoch: 6, step: 1125, loss: 0.16695, accuracy: 0.94[Train] epoch: 6, step: 1126, loss: 0.15246, accuracy: 0.91[Train] epoch: 6, step: 1127, loss: 0.19646, accuracy: 0.91[Train] epoch: 6, step: 1128, loss: 0.10674, accuracy: 1.00[Train] epoch: 6, step: 1129, loss: 0.29333, accuracy: 0.91[Train] epoch: 6, step: 1130, loss: 0.29752, accuracy: 0.91[Train] epoch: 6, step: 1131, loss: 0.20963, accuracy: 0.94[Train] epoch: 6, step: 1132, loss: 0.17691, accuracy: 0.97[Train] epoch: 6, step: 1133, loss: 0.05852, accuracy: 1.00[Train] epoch: 6, step: 1134, loss: 0.38881, accuracy: 0.84[Train] epoch: 6, step: 1135, loss: 0.13822, accuracy: 0.91[Train] epoch: 6, step: 1136, loss: 0.4

[Train] epoch: 6, step: 1401, loss: 0.09114, accuracy: 0.94[Train] epoch: 6, step: 1402, loss: 0.27172, accuracy: 0.81[Train] epoch: 6, step: 1403, loss: 0.18301, accuracy: 0.94[Train] epoch: 6, step: 1404, loss: 0.28353, accuracy: 0.91[Train] epoch: 6, step: 1405, loss: 0.40130, accuracy: 0.91[Train] epoch: 6, step: 1406, loss: 0.55452, accuracy: 0.88[Train] epoch: 6, step: 1407, loss: 0.40522, accuracy: 0.81[Train] epoch: 6, step: 1408, loss: 0.13358, accuracy: 0.97[Train] epoch: 6, step: 1409, loss: 0.20574, accuracy: 0.88[Train] epoch: 6, step: 1410, loss: 0.39346, accuracy: 0.88[Train] epoch: 6, step: 1411, loss: 0.19418, accuracy: 0.94[Train] epoch: 6, step: 1412, loss: 0.18089, accuracy: 0.91[Train] epoch: 6, step: 1413, loss: 0.23539, accuracy: 0.94[Train] epoch: 6, step: 1414, loss: 0.28358, accuracy: 0.88[Train] epoch: 6, step: 1415, loss: 0.18481, accuracy: 0.94[Train] epoch: 6, step: 1416, loss: 0.23654, accuracy: 0.91[Train] epoch: 6, step: 1417, loss: 0.2

[Train] epoch: 6, step: 1680, loss: 0.25758, accuracy: 0.91[Train] epoch: 6, step: 1681, loss: 0.19697, accuracy: 0.97[Train] epoch: 6, step: 1682, loss: 0.26523, accuracy: 0.88[Train] epoch: 6, step: 1683, loss: 0.22714, accuracy: 0.94[Train] epoch: 6, step: 1684, loss: 0.29844, accuracy: 0.91[Train] epoch: 6, step: 1685, loss: 0.15597, accuracy: 0.94[Train] epoch: 6, step: 1686, loss: 0.29068, accuracy: 0.91[Train] epoch: 6, step: 1687, loss: 0.28473, accuracy: 0.88[Train] epoch: 6, step: 1688, loss: 0.13663, accuracy: 0.97[Train] epoch: 6, step: 1689, loss: 0.16827, accuracy: 0.97[Train] epoch: 6, step: 1690, loss: 0.11475, accuracy: 0.94[Train] epoch: 6, step: 1691, loss: 0.18825, accuracy: 0.91[Train] epoch: 6, step: 1692, loss: 0.17170, accuracy: 0.94[Train] epoch: 6, step: 1693, loss: 0.42951, accuracy: 0.81[Train] epoch: 6, step: 1694, loss: 0.14634, accuracy: 0.94[Train] epoch: 6, step: 1695, loss: 0.34757, accuracy: 0.81[Train] epoch: 6, step: 1696, loss: 0.3

[Train] epoch: 7, step: 0, loss: 0.13600, accuracy: 0.97[Train] epoch: 7, step: 1, loss: 0.48155, accuracy: 0.84[Train] epoch: 7, step: 2, loss: 0.26004, accuracy: 0.88[Train] epoch: 7, step: 3, loss: 0.39896, accuracy: 0.75[Train] epoch: 7, step: 4, loss: 0.32815, accuracy: 0.84[Train] epoch: 7, step: 5, loss: 0.39669, accuracy: 0.81[Train] epoch: 7, step: 6, loss: 0.20822, accuracy: 0.94[Train] epoch: 7, step: 7, loss: 0.31787, accuracy: 0.84[Train] epoch: 7, step: 8, loss: 0.32334, accuracy: 0.88[Train] epoch: 7, step: 9, loss: 0.21065, accuracy: 0.91[Train] epoch: 7, step: 10, loss: 0.27183, accuracy: 0.88[Train] epoch: 7, step: 11, loss: 0.40139, accuracy: 0.84[Train] epoch: 7, step: 12, loss: 0.24000, accuracy: 0.97[Train] epoch: 7, step: 13, loss: 0.41863, accuracy: 0.84[Train] epoch: 7, step: 14, loss: 0.17264, accuracy: 0.91[Train] epoch: 7, step: 15, loss: 0.26425, accuracy: 0.94[Train] epoch: 7, step: 16, loss: 0.19195, accuracy: 0.91[Train] epoch: 7, step:

[Train] epoch: 7, step: 456, loss: 0.21100, accuracy: 0.97[Train] epoch: 7, step: 457, loss: 0.14464, accuracy: 0.94[Train] epoch: 7, step: 458, loss: 0.07975, accuracy: 0.97[Train] epoch: 7, step: 459, loss: 0.36329, accuracy: 0.84[Train] epoch: 7, step: 460, loss: 0.08856, accuracy: 0.97[Train] epoch: 7, step: 461, loss: 0.09443, accuracy: 0.97[Train] epoch: 7, step: 462, loss: 0.43658, accuracy: 0.88[Train] epoch: 7, step: 463, loss: 0.29224, accuracy: 0.91[Train] epoch: 7, step: 464, loss: 0.21116, accuracy: 0.91[Train] epoch: 7, step: 465, loss: 0.22805, accuracy: 0.94[Train] epoch: 7, step: 466, loss: 0.14211, accuracy: 0.97[Train] epoch: 7, step: 467, loss: 0.17212, accuracy: 0.94[Train] epoch: 7, step: 468, loss: 0.33891, accuracy: 0.84[Train] epoch: 7, step: 469, loss: 0.25369, accuracy: 0.88[Train] epoch: 7, step: 470, loss: 0.16755, accuracy: 0.91[Train] epoch: 7, step: 471, loss: 0.41036, accuracy: 0.81[Train] epoch: 7, step: 472, loss: 0.18897, accuracy: 0

[Train] epoch: 7, step: 732, loss: 0.09540, accuracy: 0.97[Train] epoch: 7, step: 733, loss: 0.22784, accuracy: 0.91[Train] epoch: 7, step: 734, loss: 0.26724, accuracy: 0.91[Train] epoch: 7, step: 735, loss: 0.08669, accuracy: 0.94[Train] epoch: 7, step: 736, loss: 0.23894, accuracy: 0.94[Train] epoch: 7, step: 737, loss: 0.05771, accuracy: 0.97[Train] epoch: 7, step: 738, loss: 0.52414, accuracy: 0.81[Train] epoch: 7, step: 739, loss: 0.19474, accuracy: 0.91[Train] epoch: 7, step: 740, loss: 0.28970, accuracy: 0.94[Train] epoch: 7, step: 741, loss: 0.15679, accuracy: 0.97[Train] epoch: 7, step: 742, loss: 0.23726, accuracy: 0.94[Train] epoch: 7, step: 743, loss: 0.34705, accuracy: 0.84[Train] epoch: 7, step: 744, loss: 0.24053, accuracy: 0.88[Train] epoch: 7, step: 745, loss: 0.28900, accuracy: 0.88[Train] epoch: 7, step: 746, loss: 0.20935, accuracy: 0.91[Train] epoch: 7, step: 747, loss: 0.26592, accuracy: 0.88[Train] epoch: 7, step: 748, loss: 0.25158, accuracy: 0

[Train] epoch: 7, step: 1010, loss: 0.09432, accuracy: 0.94[Train] epoch: 7, step: 1011, loss: 0.22177, accuracy: 0.94[Train] epoch: 7, step: 1012, loss: 0.14041, accuracy: 0.94[Train] epoch: 7, step: 1013, loss: 0.21151, accuracy: 0.94[Train] epoch: 7, step: 1014, loss: 0.13484, accuracy: 0.91[Train] epoch: 7, step: 1015, loss: 0.23037, accuracy: 0.94[Train] epoch: 7, step: 1016, loss: 0.11150, accuracy: 0.94[Train] epoch: 7, step: 1017, loss: 0.18172, accuracy: 0.94[Train] epoch: 7, step: 1018, loss: 0.15577, accuracy: 0.94[Train] epoch: 7, step: 1019, loss: 0.10473, accuracy: 1.00[Train] epoch: 7, step: 1020, loss: 0.15319, accuracy: 0.94[Train] epoch: 7, step: 1021, loss: 0.29354, accuracy: 0.88[Train] epoch: 7, step: 1022, loss: 0.30480, accuracy: 0.84[Train] epoch: 7, step: 1023, loss: 0.14696, accuracy: 0.91[Train] epoch: 7, step: 1024, loss: 0.11153, accuracy: 0.97[Train] epoch: 7, step: 1025, loss: 0.11868, accuracy: 0.91[Train] epoch: 7, step: 1026, loss: 0.1

[Train] epoch: 7, step: 1288, loss: 0.13439, accuracy: 0.97[Train] epoch: 7, step: 1289, loss: 0.28188, accuracy: 0.91[Train] epoch: 7, step: 1290, loss: 0.33031, accuracy: 0.88[Train] epoch: 7, step: 1291, loss: 0.14679, accuracy: 0.94[Train] epoch: 7, step: 1292, loss: 0.26572, accuracy: 0.97[Train] epoch: 7, step: 1293, loss: 0.18769, accuracy: 0.94[Train] epoch: 7, step: 1294, loss: 0.19788, accuracy: 0.88[Train] epoch: 7, step: 1295, loss: 0.21496, accuracy: 0.94[Train] epoch: 7, step: 1296, loss: 0.11403, accuracy: 0.94[Train] epoch: 7, step: 1297, loss: 0.18953, accuracy: 0.91[Train] epoch: 7, step: 1298, loss: 0.21599, accuracy: 0.91[Train] epoch: 7, step: 1299, loss: 0.08824, accuracy: 1.00[Train] epoch: 7, step: 1300, loss: 0.28585, accuracy: 0.88[Train] epoch: 7, step: 1301, loss: 0.20670, accuracy: 0.94[Train] epoch: 7, step: 1302, loss: 0.10375, accuracy: 0.97[Train] epoch: 7, step: 1303, loss: 0.11090, accuracy: 0.97[Train] epoch: 7, step: 1304, loss: 0.1

[Train] epoch: 7, step: 1563, loss: 0.27507, accuracy: 0.88[Train] epoch: 7, step: 1564, loss: 0.26557, accuracy: 0.91[Train] epoch: 7, step: 1565, loss: 0.04846, accuracy: 1.00[Train] epoch: 7, step: 1566, loss: 0.21547, accuracy: 0.91[Train] epoch: 7, step: 1567, loss: 0.14236, accuracy: 0.94[Train] epoch: 7, step: 1568, loss: 0.18525, accuracy: 0.91[Train] epoch: 7, step: 1569, loss: 0.21567, accuracy: 0.88[Train] epoch: 7, step: 1570, loss: 0.38031, accuracy: 0.91[Train] epoch: 7, step: 1571, loss: 0.21673, accuracy: 0.97[Train] epoch: 7, step: 1572, loss: 0.16450, accuracy: 0.94[Train] epoch: 7, step: 1573, loss: 0.31318, accuracy: 0.91[Train] epoch: 7, step: 1574, loss: 0.30826, accuracy: 0.91[Train] epoch: 7, step: 1575, loss: 0.16121, accuracy: 0.97[Train] epoch: 7, step: 1576, loss: 0.20137, accuracy: 0.94[Train] epoch: 7, step: 1577, loss: 0.35459, accuracy: 0.78[Train] epoch: 7, step: 1578, loss: 0.08627, accuracy: 0.97[Train] epoch: 7, step: 1579, loss: 0.3

[Train] epoch: 8, step: 0, loss: 0.14269, accuracy: 0.94[Train] epoch: 8, step: 1, loss: 0.35632, accuracy: 0.91[Train] epoch: 8, step: 2, loss: 0.24796, accuracy: 0.91[Train] epoch: 8, step: 3, loss: 0.36155, accuracy: 0.78[Train] epoch: 8, step: 4, loss: 0.31048, accuracy: 0.88[Train] epoch: 8, step: 5, loss: 0.34040, accuracy: 0.84[Train] epoch: 8, step: 6, loss: 0.17696, accuracy: 0.94[Train] epoch: 8, step: 7, loss: 0.34429, accuracy: 0.88[Train] epoch: 8, step: 8, loss: 0.32236, accuracy: 0.78[Train] epoch: 8, step: 9, loss: 0.20661, accuracy: 0.94[Train] epoch: 8, step: 10, loss: 0.31146, accuracy: 0.81[Train] epoch: 8, step: 11, loss: 0.23800, accuracy: 0.91[Train] epoch: 8, step: 12, loss: 0.21959, accuracy: 0.97[Train] epoch: 8, step: 13, loss: 0.37783, accuracy: 0.84[Train] epoch: 8, step: 14, loss: 0.16338, accuracy: 0.94[Train] epoch: 8, step: 15, loss: 0.26491, accuracy: 0.91[Train] epoch: 8, step: 16, loss: 0.13724, accuracy: 0.97[Train] epoch: 8, step:

[Train] epoch: 8, step: 330, loss: 0.23723, accuracy: 0.91[Train] epoch: 8, step: 331, loss: 0.17786, accuracy: 0.94[Train] epoch: 8, step: 332, loss: 0.08558, accuracy: 1.00[Train] epoch: 8, step: 333, loss: 0.36835, accuracy: 0.97[Train] epoch: 8, step: 334, loss: 0.10697, accuracy: 0.94[Train] epoch: 8, step: 335, loss: 0.38843, accuracy: 0.88[Train] epoch: 8, step: 336, loss: 0.12380, accuracy: 0.97[Train] epoch: 8, step: 337, loss: 0.10860, accuracy: 0.94[Train] epoch: 8, step: 338, loss: 0.19045, accuracy: 0.97[Train] epoch: 8, step: 339, loss: 0.03899, accuracy: 0.97[Train] epoch: 8, step: 340, loss: 0.16030, accuracy: 0.97[Train] epoch: 8, step: 341, loss: 0.17709, accuracy: 0.94[Train] epoch: 8, step: 342, loss: 0.28610, accuracy: 0.94[Train] epoch: 8, step: 343, loss: 0.32787, accuracy: 0.94[Train] epoch: 8, step: 344, loss: 0.12622, accuracy: 0.97[Train] epoch: 8, step: 345, loss: 0.18740, accuracy: 0.94[Train] epoch: 8, step: 346, loss: 0.08547, accuracy: 0

[Train] epoch: 8, step: 607, loss: 0.29167, accuracy: 0.91[Train] epoch: 8, step: 608, loss: 0.11156, accuracy: 0.94[Train] epoch: 8, step: 609, loss: 0.22746, accuracy: 0.94[Train] epoch: 8, step: 610, loss: 0.15055, accuracy: 0.94[Train] epoch: 8, step: 611, loss: 0.33198, accuracy: 0.88[Train] epoch: 8, step: 612, loss: 0.27624, accuracy: 0.91[Train] epoch: 8, step: 613, loss: 0.21881, accuracy: 0.94[Train] epoch: 8, step: 614, loss: 0.10800, accuracy: 0.97[Train] epoch: 8, step: 615, loss: 0.02374, accuracy: 1.00[Train] epoch: 8, step: 616, loss: 0.25020, accuracy: 0.88[Train] epoch: 8, step: 617, loss: 0.07997, accuracy: 0.97[Train] epoch: 8, step: 618, loss: 0.27188, accuracy: 0.91[Train] epoch: 8, step: 619, loss: 0.19652, accuracy: 0.94[Train] epoch: 8, step: 620, loss: 0.29764, accuracy: 0.91[Train] epoch: 8, step: 621, loss: 0.27462, accuracy: 0.88[Train] epoch: 8, step: 622, loss: 0.03747, accuracy: 1.00[Train] epoch: 8, step: 623, loss: 0.18171, accuracy: 0

[Train] epoch: 8, step: 880, loss: 0.08800, accuracy: 0.97[Train] epoch: 8, step: 881, loss: 0.15383, accuracy: 0.97[Train] epoch: 8, step: 882, loss: 0.31842, accuracy: 0.91[Train] epoch: 8, step: 883, loss: 0.26463, accuracy: 0.88[Train] epoch: 8, step: 884, loss: 0.25228, accuracy: 0.81[Train] epoch: 8, step: 885, loss: 0.02141, accuracy: 1.00[Train] epoch: 8, step: 886, loss: 0.16752, accuracy: 0.94[Train] epoch: 8, step: 887, loss: 0.21992, accuracy: 0.91[Train] epoch: 8, step: 888, loss: 0.41517, accuracy: 0.75[Train] epoch: 8, step: 889, loss: 0.12271, accuracy: 0.94[Train] epoch: 8, step: 890, loss: 0.43277, accuracy: 0.84[Train] epoch: 8, step: 891, loss: 0.46453, accuracy: 0.78[Train] epoch: 8, step: 892, loss: 0.15068, accuracy: 0.94[Train] epoch: 8, step: 893, loss: 0.55393, accuracy: 0.84[Train] epoch: 8, step: 894, loss: 0.11067, accuracy: 0.94[Train] epoch: 8, step: 895, loss: 0.31664, accuracy: 0.84[Train] epoch: 8, step: 896, loss: 0.15648, accuracy: 0

[Train] epoch: 8, step: 1157, loss: 0.18003, accuracy: 0.94[Train] epoch: 8, step: 1158, loss: 0.22990, accuracy: 0.88[Train] epoch: 8, step: 1159, loss: 0.36117, accuracy: 0.88[Train] epoch: 8, step: 1160, loss: 0.27135, accuracy: 0.91[Train] epoch: 8, step: 1161, loss: 0.26889, accuracy: 0.94[Train] epoch: 8, step: 1162, loss: 0.06575, accuracy: 0.97[Train] epoch: 8, step: 1163, loss: 0.16491, accuracy: 0.94[Train] epoch: 8, step: 1164, loss: 0.30919, accuracy: 0.88[Train] epoch: 8, step: 1165, loss: 0.35834, accuracy: 0.91[Train] epoch: 8, step: 1166, loss: 0.17319, accuracy: 0.91[Train] epoch: 8, step: 1167, loss: 0.12977, accuracy: 0.94[Train] epoch: 8, step: 1168, loss: 0.19626, accuracy: 0.91[Train] epoch: 8, step: 1169, loss: 0.13860, accuracy: 0.94[Train] epoch: 8, step: 1170, loss: 0.20637, accuracy: 0.91[Train] epoch: 8, step: 1171, loss: 0.14837, accuracy: 0.94[Train] epoch: 8, step: 1172, loss: 0.44498, accuracy: 0.84[Train] epoch: 8, step: 1173, loss: 0.0

[Train] epoch: 8, step: 1433, loss: 0.35389, accuracy: 0.81[Train] epoch: 8, step: 1434, loss: 0.34987, accuracy: 0.91[Train] epoch: 8, step: 1435, loss: 0.07517, accuracy: 0.97[Train] epoch: 8, step: 1436, loss: 0.18691, accuracy: 0.91[Train] epoch: 8, step: 1437, loss: 0.38161, accuracy: 0.81[Train] epoch: 8, step: 1438, loss: 0.19540, accuracy: 0.94[Train] epoch: 8, step: 1439, loss: 0.16954, accuracy: 0.94[Train] epoch: 8, step: 1440, loss: 0.09166, accuracy: 1.00[Train] epoch: 8, step: 1441, loss: 0.15816, accuracy: 0.94[Train] epoch: 8, step: 1442, loss: 0.16099, accuracy: 0.94[Train] epoch: 8, step: 1443, loss: 0.19495, accuracy: 0.94[Train] epoch: 8, step: 1444, loss: 0.21496, accuracy: 0.91[Train] epoch: 8, step: 1445, loss: 0.20372, accuracy: 0.91[Train] epoch: 8, step: 1446, loss: 0.14117, accuracy: 0.97[Train] epoch: 8, step: 1447, loss: 0.15232, accuracy: 0.97[Train] epoch: 8, step: 1448, loss: 0.38403, accuracy: 0.88[Train] epoch: 8, step: 1449, loss: 0.1

[Train] epoch: 8, step: 1711, loss: 0.19159, accuracy: 0.88[Train] epoch: 8, step: 1712, loss: 0.04305, accuracy: 1.00[Train] epoch: 8, step: 1713, loss: 0.03998, accuracy: 1.00[Train] epoch: 8, step: 1714, loss: 0.10569, accuracy: 1.00[Train] epoch: 8, step: 1715, loss: 0.48475, accuracy: 0.84[Train] epoch: 8, step: 1716, loss: 0.05384, accuracy: 1.00[Train] epoch: 8, step: 1717, loss: 0.17004, accuracy: 0.91	[Valid] acc: 0.88


[Train] epoch: 9, step: 0, loss: 0.16693, accuracy: 0.91[Train] epoch: 9, step: 1, loss: 0.30939, accuracy: 0.91[Train] epoch: 9, step: 2, loss: 0.25457, accuracy: 0.88[Train] epoch: 9, step: 3, loss: 0.47784, accuracy: 0.78[Train] epoch: 9, step: 4, loss: 0.24064, accuracy: 0.94[Train] epoch: 9, step: 5, loss: 0.31975, accuracy: 0.81[Train] epoch: 9, step: 6, loss: 0.20201, accuracy: 0.91[Train] epoch: 9, step: 7, loss: 0.23229, accuracy: 0.88[Train] epoch: 9, step: 8, loss: 0.21426, accuracy: 0.91[Train] epoch: 9, step: 9, loss: 0.13815, accuracy: 0.94[Train] epoch: 9, step: 10, loss: 0.27344, accuracy: 0.88[Train] epoch: 9, step: 11, loss: 0.24079, accuracy: 0.88[Train] epoch: 9, step: 12, loss: 0.14937, accuracy: 1.00[Train] epoch: 9, step: 13, loss: 0.38253, accuracy: 0.84[Train] epoch: 9, step: 14, loss: 0.09797, accuracy: 1.00[Train] epoch: 9, step: 15, loss: 0.29182, accuracy: 0.84[Train] epoch: 9, step: 16, loss: 0.14734, accuracy: 0.94[Train] epoch: 9, step:

[Train] epoch: 9, step: 477, loss: 0.24136, accuracy: 0.94[Train] epoch: 9, step: 478, loss: 0.26300, accuracy: 0.91[Train] epoch: 9, step: 479, loss: 0.16265, accuracy: 0.91[Train] epoch: 9, step: 480, loss: 0.10894, accuracy: 0.97[Train] epoch: 9, step: 481, loss: 0.11694, accuracy: 0.97[Train] epoch: 9, step: 482, loss: 0.11494, accuracy: 0.94[Train] epoch: 9, step: 483, loss: 0.34331, accuracy: 0.94[Train] epoch: 9, step: 484, loss: 0.07146, accuracy: 1.00[Train] epoch: 9, step: 485, loss: 0.31520, accuracy: 0.91[Train] epoch: 9, step: 486, loss: 0.20034, accuracy: 0.91[Train] epoch: 9, step: 487, loss: 0.21916, accuracy: 0.94[Train] epoch: 9, step: 488, loss: 0.12982, accuracy: 0.97[Train] epoch: 9, step: 489, loss: 0.24602, accuracy: 0.84[Train] epoch: 9, step: 490, loss: 0.20240, accuracy: 0.94[Train] epoch: 9, step: 491, loss: 0.14106, accuracy: 0.94[Train] epoch: 9, step: 492, loss: 0.32135, accuracy: 0.84[Train] epoch: 9, step: 493, loss: 0.16109, accuracy: 0

[Train] epoch: 9, step: 746, loss: 0.14566, accuracy: 0.91[Train] epoch: 9, step: 747, loss: 0.26374, accuracy: 0.91[Train] epoch: 9, step: 748, loss: 0.32333, accuracy: 0.88[Train] epoch: 9, step: 749, loss: 0.13489, accuracy: 0.97[Train] epoch: 9, step: 750, loss: 0.14559, accuracy: 0.94[Train] epoch: 9, step: 751, loss: 0.13489, accuracy: 0.94[Train] epoch: 9, step: 752, loss: 0.06690, accuracy: 1.00[Train] epoch: 9, step: 753, loss: 0.11271, accuracy: 0.97[Train] epoch: 9, step: 754, loss: 0.34419, accuracy: 0.84[Train] epoch: 9, step: 755, loss: 0.13545, accuracy: 0.91[Train] epoch: 9, step: 756, loss: 0.17191, accuracy: 0.94[Train] epoch: 9, step: 757, loss: 0.11578, accuracy: 0.94[Train] epoch: 9, step: 758, loss: 0.22629, accuracy: 0.91[Train] epoch: 9, step: 759, loss: 0.09125, accuracy: 0.97[Train] epoch: 9, step: 760, loss: 0.30250, accuracy: 0.91[Train] epoch: 9, step: 761, loss: 0.28943, accuracy: 0.88[Train] epoch: 9, step: 762, loss: 0.40741, accuracy: 0

[Train] epoch: 9, step: 1016, loss: 0.07695, accuracy: 0.97[Train] epoch: 9, step: 1017, loss: 0.15900, accuracy: 0.91[Train] epoch: 9, step: 1018, loss: 0.22939, accuracy: 0.91[Train] epoch: 9, step: 1019, loss: 0.08669, accuracy: 1.00[Train] epoch: 9, step: 1020, loss: 0.13486, accuracy: 0.91[Train] epoch: 9, step: 1021, loss: 0.28809, accuracy: 0.88[Train] epoch: 9, step: 1022, loss: 0.25587, accuracy: 0.84[Train] epoch: 9, step: 1023, loss: 0.14642, accuracy: 0.91[Train] epoch: 9, step: 1024, loss: 0.07187, accuracy: 1.00[Train] epoch: 9, step: 1025, loss: 0.08041, accuracy: 0.97[Train] epoch: 9, step: 1026, loss: 0.10453, accuracy: 0.97[Train] epoch: 9, step: 1027, loss: 0.34485, accuracy: 0.84[Train] epoch: 9, step: 1028, loss: 0.27294, accuracy: 0.91[Train] epoch: 9, step: 1029, loss: 0.42024, accuracy: 0.84[Train] epoch: 9, step: 1030, loss: 0.17830, accuracy: 0.94[Train] epoch: 9, step: 1031, loss: 0.13583, accuracy: 0.97[Train] epoch: 9, step: 1032, loss: 0.2

[Train] epoch: 9, step: 1290, loss: 0.26560, accuracy: 0.88[Train] epoch: 9, step: 1291, loss: 0.16131, accuracy: 0.97[Train] epoch: 9, step: 1292, loss: 0.34873, accuracy: 0.94[Train] epoch: 9, step: 1293, loss: 0.13558, accuracy: 0.97[Train] epoch: 9, step: 1294, loss: 0.16278, accuracy: 0.94[Train] epoch: 9, step: 1295, loss: 0.16911, accuracy: 0.94[Train] epoch: 9, step: 1296, loss: 0.10926, accuracy: 0.94[Train] epoch: 9, step: 1297, loss: 0.11658, accuracy: 1.00[Train] epoch: 9, step: 1298, loss: 0.14876, accuracy: 0.94[Train] epoch: 9, step: 1299, loss: 0.04262, accuracy: 1.00[Train] epoch: 9, step: 1300, loss: 0.23995, accuracy: 0.84[Train] epoch: 9, step: 1301, loss: 0.24213, accuracy: 0.97[Train] epoch: 9, step: 1302, loss: 0.06585, accuracy: 1.00[Train] epoch: 9, step: 1303, loss: 0.12092, accuracy: 0.97[Train] epoch: 9, step: 1304, loss: 0.11532, accuracy: 0.97[Train] epoch: 9, step: 1305, loss: 0.16389, accuracy: 0.88[Train] epoch: 9, step: 1306, loss: 0.1

[Train] epoch: 9, step: 1558, loss: 0.05415, accuracy: 1.00[Train] epoch: 9, step: 1559, loss: 0.13375, accuracy: 0.94[Train] epoch: 9, step: 1560, loss: 0.12791, accuracy: 0.94[Train] epoch: 9, step: 1561, loss: 0.57965, accuracy: 0.81[Train] epoch: 9, step: 1562, loss: 0.32375, accuracy: 0.94[Train] epoch: 9, step: 1563, loss: 0.31675, accuracy: 0.91[Train] epoch: 9, step: 1564, loss: 0.23145, accuracy: 0.91[Train] epoch: 9, step: 1565, loss: 0.04813, accuracy: 1.00[Train] epoch: 9, step: 1566, loss: 0.19418, accuracy: 0.91[Train] epoch: 9, step: 1567, loss: 0.19766, accuracy: 0.91[Train] epoch: 9, step: 1568, loss: 0.19285, accuracy: 0.94[Train] epoch: 9, step: 1569, loss: 0.19123, accuracy: 0.88[Train] epoch: 9, step: 1570, loss: 0.36402, accuracy: 0.91[Train] epoch: 9, step: 1571, loss: 0.21489, accuracy: 0.94[Train] epoch: 9, step: 1572, loss: 0.15778, accuracy: 0.94[Train] epoch: 9, step: 1573, loss: 0.27919, accuracy: 0.88[Train] epoch: 9, step: 1574, loss: 0.3