In [3]:
import torch
import random
import os.path 
import torch.nn as nn
import torch.optim as optim
import torch.utils.data as data_utils
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
import seaborn as sns
sns.set()
%matplotlib inline
plt.rcParams['figure.figsize'] = [20, 12]

In [4]:
data = pd.read_csv('semiconductor_data.csv')

# pytorch - DNN

In [5]:
device = 'cuda' if torch.cuda.is_available() else 'cpu'

# for reproducibility
random.seed(777)
torch.manual_seed(777)
if device == 'cuda':
    torch.cuda.manual_seed_all(777)

In [6]:
batch_size = 100

In [7]:
data_y = data.iloc[:,0:4]
data_X = data.iloc[:,4:]

# X컬럼, y컬럼

In [8]:
X_train, X_test ,y_train, y_test = train_test_split(data_X, data_y, test_size =0.2, shuffle = True, random_state = 34)

In [9]:
X_train

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,216,217,218,219,220,221,222,223,224,225
252398,0.683640,0.679285,0.687704,0.702817,0.694823,0.685792,0.683390,0.693732,0.668570,0.682585,...,0.475220,0.531135,0.564734,0.604675,0.640205,0.682786,0.686973,0.723523,0.731965,0.738076
375014,0.332358,0.318606,0.246727,0.223866,0.155323,0.138727,0.096084,0.047101,0.053691,0.039030,...,0.519579,0.585246,0.633325,0.665797,0.726992,0.757880,0.788201,0.790893,0.808424,0.829081
689860,0.551035,0.532835,0.483259,0.481551,0.448323,0.397172,0.359607,0.318149,0.253995,0.220641,...,0.613345,0.587888,0.566582,0.530212,0.518400,0.490918,0.452409,0.438647,0.418731,0.426592
18308,0.455448,0.467373,0.489867,0.493057,0.495527,0.507048,0.510352,0.530834,0.532276,0.527841,...,0.547348,0.567351,0.561998,0.589129,0.590251,0.589697,0.575356,0.579927,0.558663,0.571098
233548,0.503726,0.510649,0.518636,0.511645,0.485977,0.468422,0.446883,0.434034,0.415850,0.374635,...,0.350297,0.425399,0.498031,0.558058,0.620943,0.637956,0.675910,0.704436,0.714564,0.732319
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
344388,0.463386,0.458658,0.423432,0.394419,0.361129,0.357560,0.306423,0.263402,0.229935,0.187258,...,0.630474,0.627672,0.594036,0.589035,0.571627,0.530546,0.489756,0.456401,0.433368,0.419712
199765,0.298856,0.274736,0.241236,0.178815,0.168395,0.141764,0.105932,0.106010,0.114444,0.116830,...,0.474156,0.482241,0.462963,0.480489,0.507966,0.544107,0.554938,0.579944,0.614293,0.659911
749302,0.443496,0.451008,0.453753,0.464541,0.439396,0.454021,0.437515,0.408460,0.375874,0.349867,...,0.569598,0.613377,0.650704,0.692446,0.747882,0.776932,0.812338,0.837335,0.861170,0.883665
153449,0.501820,0.516873,0.503262,0.508175,0.492493,0.490643,0.493181,0.456907,0.441586,0.439788,...,0.378347,0.323547,0.277093,0.243962,0.219240,0.225385,0.238944,0.292461,0.351568,0.415855


In [10]:
X_test

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,216,217,218,219,220,221,222,223,224,225
214807,0.467163,0.479334,0.489549,0.494989,0.507534,0.514008,0.510253,0.508540,0.503635,0.494057,...,0.704643,0.710210,0.690725,0.683060,0.663558,0.621325,0.584594,0.545804,0.480629,0.438945
348765,0.559535,0.541012,0.528609,0.535068,0.516287,0.505309,0.491363,0.470956,0.432487,0.411325,...,0.719153,0.736826,0.765203,0.752474,0.764567,0.785696,0.784772,0.795292,0.786475,0.792192
334741,0.145917,0.178505,0.220577,0.223307,0.267327,0.282841,0.312560,0.320670,0.361877,0.360909,...,0.505836,0.555443,0.617969,0.630148,0.682684,0.702607,0.701457,0.739281,0.743063,0.746500
797095,0.554574,0.539270,0.532405,0.509381,0.498265,0.458554,0.429688,0.383986,0.365510,0.295077,...,0.675402,0.752451,0.772690,0.802782,0.809580,0.825176,0.855060,0.836505,0.834213,0.856087
757558,0.254148,0.278256,0.313922,0.340954,0.359798,0.404477,0.400444,0.427255,0.423394,0.419597,...,0.627864,0.661306,0.678191,0.703718,0.706503,0.712651,0.722324,0.692188,0.692276,0.647929
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
93930,0.031821,0.046677,0.044728,0.062243,0.087108,0.089447,0.092434,0.104364,0.125859,0.157654,...,0.835447,0.839128,0.851595,0.837039,0.856049,0.857974,0.832757,0.832412,0.822721,0.841659
738915,0.014582,0.034210,0.049293,0.093599,0.109265,0.143028,0.199812,0.229780,0.249825,0.282928,...,0.655175,0.649591,0.617676,0.578506,0.551225,0.503142,0.462310,0.429930,0.394668,0.394451
451967,0.190829,0.197870,0.231471,0.243481,0.277680,0.315230,0.319812,0.364301,0.361262,0.400035,...,0.492536,0.556648,0.631500,0.670053,0.707219,0.730572,0.752236,0.776033,0.797662,0.809119
85103,0.232389,0.204789,0.197157,0.199841,0.172082,0.149741,0.132643,0.114304,0.111616,0.093542,...,0.910324,0.917928,0.906389,0.906940,0.896698,0.885482,0.877966,0.885524,0.872263,0.859362


In [11]:
y_train

Unnamed: 0,layer_1,layer_2,layer_3,layer_4
252398,100,110,140,90
375014,140,270,210,150
689860,260,170,160,110
18308,10,210,110,90
233548,90,200,150,290
...,...,...,...,...
344388,130,230,200,190
199765,80,120,290,260
749302,280,230,170,230
153449,60,210,150,300


In [12]:
y_test

Unnamed: 0,layer_1,layer_2,layer_3,layer_4
214807,80,290,210,80
348765,130,280,160,160
334741,130,120,290,20
797095,300,160,200,260
757558,290,20,220,290
...,...,...,...,...
93930,40,150,120,10
738915,280,120,10,160
451967,170,230,60,180
85103,40,50,170,240


In [13]:
trn_X = torch.from_numpy(X_train.astype(float).as_matrix())
trn_y = torch.from_numpy(y_train.astype(float).as_matrix())
val_X = torch.from_numpy(X_test.astype(float).as_matrix())
val_y = torch.from_numpy(y_test.astype(float).as_matrix())

  """Entry point for launching an IPython kernel.
  
  This is separate from the ipykernel package so we can avoid doing imports until
  after removing the cwd from sys.path.


In [14]:
len(trn_X[0])

226

In [15]:
len(trn_X)

648000

In [16]:
# for dictionary batch
class Dataset(data_utils.Dataset):
   
    def __init__(self, X, y):
        self.X = X
        self.y = y
   
    def __getitem__(self, idx):
        return {'X': self.X[idx], 'y': self.y[idx]}
   
    def __len__(self):
        return len(self.X)

In [17]:
trn = Dataset(trn_X, trn_y)
trn_loader = data_utils.DataLoader(trn, batch_size=batch_size, shuffle=True)

val = Dataset(val_X, val_y)
val_loader = data_utils.DataLoader(val, batch_size=batch_size, shuffle=False)

In [18]:
len(trn.X)

648000

In [19]:
tmp = next(iter(trn_loader)) # next(iter(객체)) -> 객체를읽어준다.

# build model

In [20]:
use_cuda = torch.cuda.is_available()

In [21]:
class MLPRegressor(nn.Module):
    def __init__(self):
        super(MLPRegressor, self).__init__()
        
        
        self.hidden = nn.Sequential(
            
        nn.Linear(226, 768),
        nn.BatchNorm1d(768),
        nn.Linear(768, 768),
        nn.ReLU(),
        nn.Dropout(0.2),
        nn.Linear(768, 768),
        nn.BatchNorm1d(768),
        nn.ReLU(),
        nn.Linear(768, 768),
        nn.BatchNorm1d(768),
        nn.ReLU(),
        nn.Dropout(0.2),
        nn.Linear(768, 768),
        nn.BatchNorm1d(768),
        nn.ReLU(),
        nn.Dropout(0.2),
        nn.Linear(768, 768),
        nn.BatchNorm1d(768),
        nn.ReLU(),
        nn.Linear(768, 4)

        )
        if use_cuda:
            self.hidden = self.hidden.cuda()
    def forward(self, x):
        o = self.hidden(x)
        return o
    

# Train model_mse,rmsprop

In [22]:
def mae(trn_pred, trn_y):
    abs_value = abs(trn_pred - trn_y)
    return abs_value

In [23]:
file = 'C:/Users/1-12/semiconductor_project/test_model.pth'

if os.path.isfile(file):
  model = MLPRegressor()
  model.load_state_dict(torch.load(file))
  model.eval()
  print("Yes. it is a file")

else : 
  model = MLPRegressor()
  print("create a new model")
# 예제 Textfil

Yes. it is a file


In [24]:
log_interval = 200
device = torch.device("cuda" if use_cuda else "cpu")

In [25]:
learning_rate = 1e-3
optimizer = optim.RMSprop(model.parameters(), lr=learning_rate)

In [28]:
epochs = 1000-49
batches = len(trn_loader)

In [None]:
trn_loss_list = []
val_loss_list = []

for epoch in range(epochs):
    trn_loss_summary = 0.0
    for i, trn in enumerate(trn_loader):
        trn_X, trn_y = trn['X'], trn['y']
        if use_cuda:
            trn_X, trn_y = trn_X.cuda(), trn_y.cuda()
        optimizer.zero_grad()
        trn_pred = model(trn_X.float())
        trn_loss = mae(trn_pred.double(), trn_y.double())
#         loss.backward()
        trn_loss.sum().backward()
        optimizer.step()
        
        trn_loss_summary += trn_loss.sum()
        
        if (i+1) % 15 == 0:
            with torch.no_grad():
                val_loss_summary = 0.0
                for j, val in enumerate(val_loader):
                    val_X, val_y = val['X'], val['y']
                    if use_cuda:
                        val_X, val_y = val_X.cuda(), val_y.cuda()
                    val_pred = model(val_X.float())
                    val_loss = mae(val_pred.double(), val_y.double())
                    val_loss_summary += val_loss.sum()
                
            print("epoch: {}/{} | step: {}/{} | trn_loss: {:.4f} | val_loss: {:.4f}".format(
                epoch + 1, epochs, i+1, batches, (trn_loss_summary/15)**(1/2), (val_loss_summary/len(val_loader))**(1/2)
            ))
                
            trn_loss_list.append((trn_loss_summary/15)**(1/2))
            val_loss_list.append((val_loss_summary/len(val_loader))**(1/2))
            trn_loss_summary = 0.0
            
        # 모델 저장
        savePath = "test_model.pth"
        torch.save(model.state_dict(), savePath)

print("finish Training")

epoch: 1/951 | step: 15/6480 | trn_loss: 32.8700 | val_loss: 32.9714
epoch: 1/951 | step: 30/6480 | trn_loss: 34.7986 | val_loss: 34.5318
epoch: 1/951 | step: 45/6480 | trn_loss: 34.3170 | val_loss: 34.3742
epoch: 1/951 | step: 60/6480 | trn_loss: 33.9791 | val_loss: 34.0433
epoch: 1/951 | step: 75/6480 | trn_loss: 32.8310 | val_loss: 32.1382
epoch: 1/951 | step: 90/6480 | trn_loss: 32.0434 | val_loss: 32.1570
epoch: 1/951 | step: 105/6480 | trn_loss: 32.8234 | val_loss: 33.2031
epoch: 1/951 | step: 120/6480 | trn_loss: 31.6780 | val_loss: 32.4720
epoch: 1/951 | step: 135/6480 | trn_loss: 32.2218 | val_loss: 32.4490
epoch: 1/951 | step: 150/6480 | trn_loss: 31.2902 | val_loss: 33.4102
epoch: 1/951 | step: 165/6480 | trn_loss: 31.0231 | val_loss: 33.3822
epoch: 1/951 | step: 180/6480 | trn_loss: 32.1445 | val_loss: 33.4149
epoch: 1/951 | step: 195/6480 | trn_loss: 31.5492 | val_loss: 32.8169
epoch: 1/951 | step: 210/6480 | trn_loss: 32.8797 | val_loss: 32.5961
epoch: 1/951 | step: 225/6

epoch: 1/951 | step: 1755/6480 | trn_loss: 29.8917 | val_loss: 32.7485
epoch: 1/951 | step: 1770/6480 | trn_loss: 31.6509 | val_loss: 31.1424
epoch: 1/951 | step: 1785/6480 | trn_loss: 30.1342 | val_loss: 30.5669
epoch: 1/951 | step: 1800/6480 | trn_loss: 31.3969 | val_loss: 32.5177
epoch: 1/951 | step: 1815/6480 | trn_loss: 32.1715 | val_loss: 31.1350
epoch: 1/951 | step: 1830/6480 | trn_loss: 30.5961 | val_loss: 30.0468
epoch: 1/951 | step: 1845/6480 | trn_loss: 30.3334 | val_loss: 30.3848
epoch: 1/951 | step: 1860/6480 | trn_loss: 30.3694 | val_loss: 30.5810
epoch: 1/951 | step: 1875/6480 | trn_loss: 29.5988 | val_loss: 32.3973
epoch: 1/951 | step: 1890/6480 | trn_loss: 30.5280 | val_loss: 31.0273
epoch: 1/951 | step: 1905/6480 | trn_loss: 31.0122 | val_loss: 31.8671
epoch: 1/951 | step: 1920/6480 | trn_loss: 31.9306 | val_loss: 29.3464
epoch: 1/951 | step: 1935/6480 | trn_loss: 29.8669 | val_loss: 31.1835
epoch: 1/951 | step: 1950/6480 | trn_loss: 30.7552 | val_loss: 29.1811
epoch:

epoch: 1/951 | step: 3480/6480 | trn_loss: 29.4617 | val_loss: 29.1385
epoch: 1/951 | step: 3495/6480 | trn_loss: 29.7603 | val_loss: 31.1879
epoch: 1/951 | step: 3510/6480 | trn_loss: 29.6593 | val_loss: 29.4578
epoch: 1/951 | step: 3525/6480 | trn_loss: 30.0180 | val_loss: 29.8243
epoch: 1/951 | step: 3540/6480 | trn_loss: 30.0644 | val_loss: 28.5975
epoch: 1/951 | step: 3555/6480 | trn_loss: 29.5537 | val_loss: 29.5136
epoch: 1/951 | step: 3570/6480 | trn_loss: 29.9393 | val_loss: 30.1789
epoch: 1/951 | step: 3585/6480 | trn_loss: 29.8088 | val_loss: 30.1164
epoch: 1/951 | step: 3600/6480 | trn_loss: 28.9002 | val_loss: 29.7608
epoch: 1/951 | step: 3615/6480 | trn_loss: 29.4603 | val_loss: 31.8132
epoch: 1/951 | step: 3630/6480 | trn_loss: 29.1723 | val_loss: 29.4342
epoch: 1/951 | step: 3645/6480 | trn_loss: 29.0602 | val_loss: 28.2689
epoch: 1/951 | step: 3660/6480 | trn_loss: 28.3979 | val_loss: 30.1042
epoch: 1/951 | step: 3675/6480 | trn_loss: 30.2440 | val_loss: 29.5115
epoch:

epoch: 1/951 | step: 5205/6480 | trn_loss: 29.9256 | val_loss: 28.9472
epoch: 1/951 | step: 5220/6480 | trn_loss: 27.9144 | val_loss: 29.3253
epoch: 1/951 | step: 5235/6480 | trn_loss: 28.8686 | val_loss: 30.0924
epoch: 1/951 | step: 5250/6480 | trn_loss: 28.6507 | val_loss: 29.2797
epoch: 1/951 | step: 5265/6480 | trn_loss: 29.0077 | val_loss: 28.8615
epoch: 1/951 | step: 5280/6480 | trn_loss: 30.5233 | val_loss: 32.0612
epoch: 1/951 | step: 5295/6480 | trn_loss: 28.7644 | val_loss: 29.1915
epoch: 1/951 | step: 5310/6480 | trn_loss: 29.5121 | val_loss: 28.9739
epoch: 1/951 | step: 5325/6480 | trn_loss: 28.8389 | val_loss: 27.9328
epoch: 1/951 | step: 5340/6480 | trn_loss: 28.5747 | val_loss: 28.5213
epoch: 1/951 | step: 5355/6480 | trn_loss: 29.3545 | val_loss: 30.6197
epoch: 1/951 | step: 5370/6480 | trn_loss: 28.9765 | val_loss: 28.5052
epoch: 1/951 | step: 5385/6480 | trn_loss: 29.3647 | val_loss: 29.8006
epoch: 1/951 | step: 5400/6480 | trn_loss: 28.0988 | val_loss: 28.1096
epoch:

epoch: 2/951 | step: 450/6480 | trn_loss: 28.0877 | val_loss: 29.2837
epoch: 2/951 | step: 465/6480 | trn_loss: 28.5905 | val_loss: 28.3329
epoch: 2/951 | step: 480/6480 | trn_loss: 28.0915 | val_loss: 28.5207
epoch: 2/951 | step: 495/6480 | trn_loss: 27.0672 | val_loss: 27.5342
epoch: 2/951 | step: 510/6480 | trn_loss: 28.2274 | val_loss: 29.2693
epoch: 2/951 | step: 525/6480 | trn_loss: 29.5398 | val_loss: 28.9987
epoch: 2/951 | step: 540/6480 | trn_loss: 27.9526 | val_loss: 30.9545
epoch: 2/951 | step: 555/6480 | trn_loss: 27.8127 | val_loss: 28.6642
epoch: 2/951 | step: 570/6480 | trn_loss: 27.7638 | val_loss: 30.2136
epoch: 2/951 | step: 585/6480 | trn_loss: 29.7149 | val_loss: 28.8789
epoch: 2/951 | step: 600/6480 | trn_loss: 29.2383 | val_loss: 29.3176
epoch: 2/951 | step: 615/6480 | trn_loss: 29.0108 | val_loss: 28.6962
epoch: 2/951 | step: 630/6480 | trn_loss: 28.1294 | val_loss: 28.7908
epoch: 2/951 | step: 645/6480 | trn_loss: 28.1445 | val_loss: 29.9409
epoch: 2/951 | step:

epoch: 2/951 | step: 2175/6480 | trn_loss: 27.6980 | val_loss: 29.2607
epoch: 2/951 | step: 2190/6480 | trn_loss: 27.9685 | val_loss: 28.5939
epoch: 2/951 | step: 2205/6480 | trn_loss: 27.8623 | val_loss: 28.0118
epoch: 2/951 | step: 2220/6480 | trn_loss: 27.5345 | val_loss: 28.0672
epoch: 2/951 | step: 2235/6480 | trn_loss: 27.3948 | val_loss: 28.2710
epoch: 2/951 | step: 2250/6480 | trn_loss: 28.5748 | val_loss: 27.6370
epoch: 2/951 | step: 2265/6480 | trn_loss: 28.0008 | val_loss: 27.5977
epoch: 2/951 | step: 2280/6480 | trn_loss: 27.2392 | val_loss: 27.5562
epoch: 2/951 | step: 2295/6480 | trn_loss: 28.7959 | val_loss: 28.3884
epoch: 2/951 | step: 2310/6480 | trn_loss: 27.8158 | val_loss: 29.3811
epoch: 2/951 | step: 2325/6480 | trn_loss: 28.6518 | val_loss: 27.7881
epoch: 2/951 | step: 2340/6480 | trn_loss: 28.9227 | val_loss: 29.0997
epoch: 2/951 | step: 2355/6480 | trn_loss: 28.6428 | val_loss: 28.9236
epoch: 2/951 | step: 2370/6480 | trn_loss: 28.1285 | val_loss: 30.0919
epoch:

epoch: 2/951 | step: 3900/6480 | trn_loss: 28.9103 | val_loss: 28.2577
epoch: 2/951 | step: 3915/6480 | trn_loss: 27.9582 | val_loss: 27.3510
epoch: 2/951 | step: 3930/6480 | trn_loss: 29.4973 | val_loss: 28.7304
epoch: 2/951 | step: 3945/6480 | trn_loss: 27.9194 | val_loss: 26.4492
epoch: 2/951 | step: 3960/6480 | trn_loss: 27.2090 | val_loss: 30.2863
epoch: 2/951 | step: 3975/6480 | trn_loss: 27.5610 | val_loss: 28.8334
epoch: 2/951 | step: 3990/6480 | trn_loss: 27.5372 | val_loss: 28.6277
epoch: 2/951 | step: 4005/6480 | trn_loss: 27.4165 | val_loss: 28.8357
epoch: 2/951 | step: 4020/6480 | trn_loss: 28.4628 | val_loss: 27.0569
epoch: 2/951 | step: 4035/6480 | trn_loss: 27.9335 | val_loss: 27.5418
epoch: 2/951 | step: 4050/6480 | trn_loss: 26.5624 | val_loss: 27.6284
epoch: 2/951 | step: 4065/6480 | trn_loss: 27.6738 | val_loss: 34.6785
epoch: 2/951 | step: 4080/6480 | trn_loss: 28.9747 | val_loss: 30.2544
epoch: 2/951 | step: 4095/6480 | trn_loss: 27.9936 | val_loss: 29.2119
epoch:

epoch: 2/951 | step: 5625/6480 | trn_loss: 27.4559 | val_loss: 28.4510
epoch: 2/951 | step: 5640/6480 | trn_loss: 28.0571 | val_loss: 28.0634
epoch: 2/951 | step: 5655/6480 | trn_loss: 26.6636 | val_loss: 26.9678
epoch: 2/951 | step: 5670/6480 | trn_loss: 28.1594 | val_loss: 27.0199
epoch: 2/951 | step: 5685/6480 | trn_loss: 27.3719 | val_loss: 28.4763
epoch: 2/951 | step: 5700/6480 | trn_loss: 27.7149 | val_loss: 27.1462
epoch: 2/951 | step: 5715/6480 | trn_loss: 27.2700 | val_loss: 28.4967
epoch: 2/951 | step: 5730/6480 | trn_loss: 27.1532 | val_loss: 27.5117
epoch: 2/951 | step: 5745/6480 | trn_loss: 27.0146 | val_loss: 27.4002
epoch: 2/951 | step: 5760/6480 | trn_loss: 27.3096 | val_loss: 27.9008
epoch: 2/951 | step: 5775/6480 | trn_loss: 28.5358 | val_loss: 27.7918
epoch: 2/951 | step: 5790/6480 | trn_loss: 26.8618 | val_loss: 29.4749
epoch: 2/951 | step: 5805/6480 | trn_loss: 27.1159 | val_loss: 26.6171
epoch: 2/951 | step: 5820/6480 | trn_loss: 26.2736 | val_loss: 30.0454
epoch:

epoch: 3/951 | step: 885/6480 | trn_loss: 28.0316 | val_loss: 28.0330
epoch: 3/951 | step: 900/6480 | trn_loss: 27.3470 | val_loss: 29.3108
epoch: 3/951 | step: 915/6480 | trn_loss: 26.2789 | val_loss: 27.6784
epoch: 3/951 | step: 930/6480 | trn_loss: 27.8565 | val_loss: 28.6755
epoch: 3/951 | step: 945/6480 | trn_loss: 26.1600 | val_loss: 27.1607
epoch: 3/951 | step: 960/6480 | trn_loss: 27.5580 | val_loss: 27.4820
epoch: 3/951 | step: 975/6480 | trn_loss: 27.3670 | val_loss: 27.2647
epoch: 3/951 | step: 990/6480 | trn_loss: 26.9549 | val_loss: 27.9150
epoch: 3/951 | step: 1005/6480 | trn_loss: 27.5406 | val_loss: 26.5395
epoch: 3/951 | step: 1020/6480 | trn_loss: 26.0911 | val_loss: 27.5580
epoch: 3/951 | step: 1035/6480 | trn_loss: 27.6285 | val_loss: 28.7889
epoch: 3/951 | step: 1050/6480 | trn_loss: 27.3605 | val_loss: 27.4053
epoch: 3/951 | step: 1065/6480 | trn_loss: 26.6647 | val_loss: 28.3068
epoch: 3/951 | step: 1080/6480 | trn_loss: 26.5227 | val_loss: 27.3424
epoch: 3/951 |

epoch: 3/951 | step: 2610/6480 | trn_loss: 27.5477 | val_loss: 27.8734
epoch: 3/951 | step: 2625/6480 | trn_loss: 26.3908 | val_loss: 27.8966
epoch: 3/951 | step: 2640/6480 | trn_loss: 26.9513 | val_loss: 28.9967
epoch: 3/951 | step: 2655/6480 | trn_loss: 27.1420 | val_loss: 27.3138
epoch: 3/951 | step: 2670/6480 | trn_loss: 26.5170 | val_loss: 27.5300
epoch: 3/951 | step: 2685/6480 | trn_loss: 28.1434 | val_loss: 28.6850
epoch: 3/951 | step: 2700/6480 | trn_loss: 27.0824 | val_loss: 27.4007
epoch: 3/951 | step: 2715/6480 | trn_loss: 26.4669 | val_loss: 27.8339
epoch: 3/951 | step: 2730/6480 | trn_loss: 26.6253 | val_loss: 28.9554
epoch: 3/951 | step: 2745/6480 | trn_loss: 26.6986 | val_loss: 27.4582
epoch: 3/951 | step: 2760/6480 | trn_loss: 29.0254 | val_loss: 27.4427
epoch: 3/951 | step: 2775/6480 | trn_loss: 26.5008 | val_loss: 25.8709
epoch: 3/951 | step: 2790/6480 | trn_loss: 25.9948 | val_loss: 27.6992
epoch: 3/951 | step: 2805/6480 | trn_loss: 27.4345 | val_loss: 27.2328
epoch:

epoch: 3/951 | step: 4335/6480 | trn_loss: 27.3853 | val_loss: 28.2544
epoch: 3/951 | step: 4350/6480 | trn_loss: 26.6144 | val_loss: 29.0184
epoch: 3/951 | step: 4365/6480 | trn_loss: 27.3126 | val_loss: 26.0824
epoch: 3/951 | step: 4380/6480 | trn_loss: 26.8352 | val_loss: 28.3584
epoch: 3/951 | step: 4395/6480 | trn_loss: 27.4443 | val_loss: 27.1541
epoch: 3/951 | step: 4410/6480 | trn_loss: 26.3641 | val_loss: 25.7978
epoch: 3/951 | step: 4425/6480 | trn_loss: 25.6593 | val_loss: 26.8608
epoch: 3/951 | step: 4440/6480 | trn_loss: 26.8549 | val_loss: 26.1954
epoch: 3/951 | step: 4455/6480 | trn_loss: 26.7891 | val_loss: 27.6716
epoch: 3/951 | step: 4470/6480 | trn_loss: 27.1706 | val_loss: 28.5850
epoch: 3/951 | step: 4485/6480 | trn_loss: 26.4059 | val_loss: 26.3960
epoch: 3/951 | step: 4500/6480 | trn_loss: 26.4641 | val_loss: 27.0882
epoch: 3/951 | step: 4515/6480 | trn_loss: 28.1528 | val_loss: 32.4480
epoch: 3/951 | step: 4530/6480 | trn_loss: 26.2995 | val_loss: 27.0909
epoch:

epoch: 3/951 | step: 6060/6480 | trn_loss: 26.6442 | val_loss: 26.7816
epoch: 3/951 | step: 6075/6480 | trn_loss: 25.9892 | val_loss: 26.6933
epoch: 3/951 | step: 6090/6480 | trn_loss: 26.3337 | val_loss: 28.8022
epoch: 3/951 | step: 6105/6480 | trn_loss: 27.1142 | val_loss: 28.1743
epoch: 3/951 | step: 6120/6480 | trn_loss: 25.7943 | val_loss: 26.1844
epoch: 3/951 | step: 6135/6480 | trn_loss: 27.3577 | val_loss: 26.3163
epoch: 3/951 | step: 6150/6480 | trn_loss: 26.0226 | val_loss: 26.0473
epoch: 3/951 | step: 6165/6480 | trn_loss: 26.1975 | val_loss: 27.0471
epoch: 3/951 | step: 6180/6480 | trn_loss: 27.3387 | val_loss: 28.2747
epoch: 3/951 | step: 6195/6480 | trn_loss: 26.9476 | val_loss: 26.5338
epoch: 3/951 | step: 6210/6480 | trn_loss: 26.3445 | val_loss: 26.0085
epoch: 3/951 | step: 6225/6480 | trn_loss: 26.0797 | val_loss: 27.3617
epoch: 3/951 | step: 6240/6480 | trn_loss: 27.7380 | val_loss: 26.8563
epoch: 3/951 | step: 6255/6480 | trn_loss: 28.1312 | val_loss: 28.1371
epoch:

epoch: 4/951 | step: 1320/6480 | trn_loss: 24.9944 | val_loss: 28.0990
epoch: 4/951 | step: 1335/6480 | trn_loss: 27.2932 | val_loss: 27.2056
epoch: 4/951 | step: 1350/6480 | trn_loss: 26.7499 | val_loss: 26.9576
epoch: 4/951 | step: 1365/6480 | trn_loss: 25.5582 | val_loss: 27.3340
epoch: 4/951 | step: 1380/6480 | trn_loss: 26.1058 | val_loss: 26.2002
epoch: 4/951 | step: 1395/6480 | trn_loss: 26.9080 | val_loss: 27.0684
epoch: 4/951 | step: 1410/6480 | trn_loss: 26.2370 | val_loss: 27.8419
epoch: 4/951 | step: 1425/6480 | trn_loss: 26.1152 | val_loss: 25.8709
epoch: 4/951 | step: 1440/6480 | trn_loss: 26.3289 | val_loss: 25.7845
epoch: 4/951 | step: 1455/6480 | trn_loss: 26.4081 | val_loss: 27.1229
epoch: 4/951 | step: 1470/6480 | trn_loss: 26.5673 | val_loss: 25.6536
epoch: 4/951 | step: 1485/6480 | trn_loss: 25.4572 | val_loss: 26.6474
epoch: 4/951 | step: 1500/6480 | trn_loss: 26.6665 | val_loss: 27.7108
epoch: 4/951 | step: 1515/6480 | trn_loss: 26.4758 | val_loss: 28.8921
epoch:

epoch: 4/951 | step: 3045/6480 | trn_loss: 25.4547 | val_loss: 25.5887
epoch: 4/951 | step: 3060/6480 | trn_loss: 25.5370 | val_loss: 25.5252
epoch: 4/951 | step: 3075/6480 | trn_loss: 26.7223 | val_loss: 26.1876
epoch: 4/951 | step: 3090/6480 | trn_loss: 26.2938 | val_loss: 26.5485
epoch: 4/951 | step: 3105/6480 | trn_loss: 26.6461 | val_loss: 27.6002
epoch: 4/951 | step: 3120/6480 | trn_loss: 25.3049 | val_loss: 26.8903
epoch: 4/951 | step: 3135/6480 | trn_loss: 26.0729 | val_loss: 30.1171
epoch: 4/951 | step: 3150/6480 | trn_loss: 26.0991 | val_loss: 27.6333
epoch: 4/951 | step: 3165/6480 | trn_loss: 27.2848 | val_loss: 27.1618
epoch: 4/951 | step: 3180/6480 | trn_loss: 27.4401 | val_loss: 27.7520
epoch: 4/951 | step: 3195/6480 | trn_loss: 27.4900 | val_loss: 26.3219
epoch: 4/951 | step: 3210/6480 | trn_loss: 26.1206 | val_loss: 26.4570
epoch: 4/951 | step: 3225/6480 | trn_loss: 27.3132 | val_loss: 27.6237
epoch: 4/951 | step: 3240/6480 | trn_loss: 25.9375 | val_loss: 27.7928
epoch:

epoch: 4/951 | step: 4770/6480 | trn_loss: 25.5459 | val_loss: 26.1447
epoch: 4/951 | step: 4785/6480 | trn_loss: 25.8192 | val_loss: 26.4972
epoch: 4/951 | step: 4800/6480 | trn_loss: 26.5379 | val_loss: 26.3539
epoch: 4/951 | step: 4815/6480 | trn_loss: 26.6147 | val_loss: 27.4966
epoch: 4/951 | step: 4830/6480 | trn_loss: 27.0690 | val_loss: 26.3789
epoch: 4/951 | step: 4845/6480 | trn_loss: 25.5170 | val_loss: 26.9730
epoch: 4/951 | step: 4860/6480 | trn_loss: 26.5723 | val_loss: 25.4516
epoch: 4/951 | step: 4875/6480 | trn_loss: 26.4998 | val_loss: 26.9325
epoch: 4/951 | step: 4890/6480 | trn_loss: 26.0875 | val_loss: 25.9809
epoch: 4/951 | step: 4905/6480 | trn_loss: 26.7265 | val_loss: 26.5006
epoch: 4/951 | step: 4920/6480 | trn_loss: 25.7011 | val_loss: 25.7072
epoch: 4/951 | step: 4935/6480 | trn_loss: 24.8772 | val_loss: 25.8970
epoch: 4/951 | step: 4950/6480 | trn_loss: 26.1354 | val_loss: 29.3363
epoch: 4/951 | step: 4965/6480 | trn_loss: 26.4557 | val_loss: 25.8441
epoch:

epoch: 5/951 | step: 15/6480 | trn_loss: 24.6047 | val_loss: 26.4641
epoch: 5/951 | step: 30/6480 | trn_loss: 26.9211 | val_loss: 26.2312
epoch: 5/951 | step: 45/6480 | trn_loss: 26.6897 | val_loss: 25.6669
epoch: 5/951 | step: 60/6480 | trn_loss: 25.8074 | val_loss: 25.4549
epoch: 5/951 | step: 75/6480 | trn_loss: 25.6694 | val_loss: 27.3448
epoch: 5/951 | step: 90/6480 | trn_loss: 25.2418 | val_loss: 25.4133
epoch: 5/951 | step: 105/6480 | trn_loss: 25.8344 | val_loss: 24.3733
epoch: 5/951 | step: 120/6480 | trn_loss: 24.4982 | val_loss: 25.5435
epoch: 5/951 | step: 135/6480 | trn_loss: 25.8633 | val_loss: 25.4644
epoch: 5/951 | step: 150/6480 | trn_loss: 24.7773 | val_loss: 26.6134
epoch: 5/951 | step: 165/6480 | trn_loss: 25.9237 | val_loss: 26.7043
epoch: 5/951 | step: 180/6480 | trn_loss: 24.7081 | val_loss: 25.0008
epoch: 5/951 | step: 195/6480 | trn_loss: 26.2357 | val_loss: 27.2135
epoch: 5/951 | step: 210/6480 | trn_loss: 26.3046 | val_loss: 27.1944
epoch: 5/951 | step: 225/6

epoch: 5/951 | step: 1755/6480 | trn_loss: 25.8821 | val_loss: 24.9568
epoch: 5/951 | step: 1770/6480 | trn_loss: 26.3130 | val_loss: 25.9116
epoch: 5/951 | step: 1785/6480 | trn_loss: 24.4004 | val_loss: 27.1413
epoch: 5/951 | step: 1800/6480 | trn_loss: 25.2083 | val_loss: 26.7335
epoch: 5/951 | step: 1815/6480 | trn_loss: 25.6925 | val_loss: 26.4621
epoch: 5/951 | step: 1830/6480 | trn_loss: 24.9464 | val_loss: 25.7535
epoch: 5/951 | step: 1845/6480 | trn_loss: 25.3201 | val_loss: 26.2514
epoch: 5/951 | step: 1860/6480 | trn_loss: 26.5560 | val_loss: 25.0826
epoch: 5/951 | step: 1875/6480 | trn_loss: 25.2827 | val_loss: 25.7945
epoch: 5/951 | step: 1890/6480 | trn_loss: 24.7334 | val_loss: 24.4446
epoch: 5/951 | step: 1905/6480 | trn_loss: 25.8206 | val_loss: 25.4131
epoch: 5/951 | step: 1920/6480 | trn_loss: 25.6446 | val_loss: 27.4607
epoch: 5/951 | step: 1935/6480 | trn_loss: 25.1028 | val_loss: 25.6921
epoch: 5/951 | step: 1950/6480 | trn_loss: 25.9282 | val_loss: 27.0803
epoch:

epoch: 5/951 | step: 3480/6480 | trn_loss: 24.8273 | val_loss: 26.4134
epoch: 5/951 | step: 3495/6480 | trn_loss: 25.4375 | val_loss: 26.7397
epoch: 5/951 | step: 3510/6480 | trn_loss: 25.8443 | val_loss: 29.2348
epoch: 5/951 | step: 3525/6480 | trn_loss: 26.2481 | val_loss: 25.8259
epoch: 5/951 | step: 3540/6480 | trn_loss: 26.4917 | val_loss: 27.0341
epoch: 5/951 | step: 3555/6480 | trn_loss: 25.2423 | val_loss: 25.6159
epoch: 5/951 | step: 3570/6480 | trn_loss: 25.0176 | val_loss: 26.4657
epoch: 5/951 | step: 3585/6480 | trn_loss: 26.0474 | val_loss: 26.2651
epoch: 5/951 | step: 3600/6480 | trn_loss: 24.8919 | val_loss: 26.5594
epoch: 5/951 | step: 3615/6480 | trn_loss: 26.5291 | val_loss: 26.2377
epoch: 5/951 | step: 3630/6480 | trn_loss: 25.3021 | val_loss: 27.5857
epoch: 5/951 | step: 3645/6480 | trn_loss: 25.4556 | val_loss: 26.0605
epoch: 5/951 | step: 3660/6480 | trn_loss: 25.8162 | val_loss: 25.8274
epoch: 5/951 | step: 3675/6480 | trn_loss: 25.2625 | val_loss: 26.1281
epoch:

epoch: 5/951 | step: 5205/6480 | trn_loss: 26.2410 | val_loss: 27.0952
epoch: 5/951 | step: 5220/6480 | trn_loss: 25.7547 | val_loss: 25.4295
epoch: 5/951 | step: 5235/6480 | trn_loss: 25.1653 | val_loss: 26.1805
epoch: 5/951 | step: 5250/6480 | trn_loss: 25.1056 | val_loss: 24.6680
epoch: 5/951 | step: 5265/6480 | trn_loss: 25.0204 | val_loss: 27.3730
epoch: 5/951 | step: 5280/6480 | trn_loss: 25.3631 | val_loss: 25.9713
epoch: 5/951 | step: 5295/6480 | trn_loss: 24.7790 | val_loss: 24.6573
epoch: 5/951 | step: 5310/6480 | trn_loss: 25.0917 | val_loss: 25.9845
epoch: 5/951 | step: 5325/6480 | trn_loss: 24.1928 | val_loss: 25.8259
epoch: 5/951 | step: 5340/6480 | trn_loss: 24.7736 | val_loss: 27.0466
epoch: 5/951 | step: 5355/6480 | trn_loss: 26.4120 | val_loss: 25.4527
epoch: 5/951 | step: 5370/6480 | trn_loss: 25.4306 | val_loss: 25.9824
epoch: 5/951 | step: 5385/6480 | trn_loss: 25.0321 | val_loss: 25.6282
epoch: 5/951 | step: 5400/6480 | trn_loss: 25.3480 | val_loss: 25.3167
epoch:

epoch: 6/951 | step: 450/6480 | trn_loss: 24.0403 | val_loss: 24.6610
epoch: 6/951 | step: 465/6480 | trn_loss: 24.9177 | val_loss: 25.4096
epoch: 6/951 | step: 480/6480 | trn_loss: 24.2763 | val_loss: 25.3043
epoch: 6/951 | step: 495/6480 | trn_loss: 25.2975 | val_loss: 25.6997
epoch: 6/951 | step: 510/6480 | trn_loss: 25.7021 | val_loss: 25.8080
epoch: 6/951 | step: 525/6480 | trn_loss: 25.2194 | val_loss: 28.3490
epoch: 6/951 | step: 540/6480 | trn_loss: 24.4891 | val_loss: 24.6741
epoch: 6/951 | step: 555/6480 | trn_loss: 25.1930 | val_loss: 26.1013
epoch: 6/951 | step: 570/6480 | trn_loss: 24.7849 | val_loss: 25.4580
epoch: 6/951 | step: 585/6480 | trn_loss: 24.9531 | val_loss: 25.6639
epoch: 6/951 | step: 600/6480 | trn_loss: 24.8820 | val_loss: 25.0813
epoch: 6/951 | step: 615/6480 | trn_loss: 25.3204 | val_loss: 25.2327
epoch: 6/951 | step: 630/6480 | trn_loss: 25.9069 | val_loss: 25.5095
epoch: 6/951 | step: 645/6480 | trn_loss: 24.5198 | val_loss: 27.7782
epoch: 6/951 | step:

epoch: 6/951 | step: 2175/6480 | trn_loss: 24.4388 | val_loss: 26.5733
epoch: 6/951 | step: 2190/6480 | trn_loss: 24.8922 | val_loss: 33.0624
epoch: 6/951 | step: 2205/6480 | trn_loss: 26.2423 | val_loss: 26.1423
epoch: 6/951 | step: 2220/6480 | trn_loss: 25.2578 | val_loss: 25.6496
epoch: 6/951 | step: 2235/6480 | trn_loss: 25.2362 | val_loss: 23.7632
epoch: 6/951 | step: 2250/6480 | trn_loss: 25.9771 | val_loss: 25.5740
epoch: 6/951 | step: 2265/6480 | trn_loss: 25.2564 | val_loss: 24.5922
epoch: 6/951 | step: 2280/6480 | trn_loss: 24.7912 | val_loss: 25.2506
epoch: 6/951 | step: 2295/6480 | trn_loss: 25.5249 | val_loss: 26.4195
epoch: 6/951 | step: 2310/6480 | trn_loss: 25.1349 | val_loss: 25.2333
epoch: 6/951 | step: 2325/6480 | trn_loss: 24.2633 | val_loss: 24.7996
epoch: 6/951 | step: 2340/6480 | trn_loss: 24.3896 | val_loss: 25.7388
epoch: 6/951 | step: 2355/6480 | trn_loss: 25.5459 | val_loss: 25.7467
epoch: 6/951 | step: 2370/6480 | trn_loss: 25.2952 | val_loss: 25.3775
epoch:

epoch: 6/951 | step: 3900/6480 | trn_loss: 24.6964 | val_loss: 24.6459
epoch: 6/951 | step: 3915/6480 | trn_loss: 24.7945 | val_loss: 28.1401
epoch: 6/951 | step: 3930/6480 | trn_loss: 25.5406 | val_loss: 25.4971
epoch: 6/951 | step: 3945/6480 | trn_loss: 25.2751 | val_loss: 26.0349
epoch: 6/951 | step: 3960/6480 | trn_loss: 24.9562 | val_loss: 26.5096
epoch: 6/951 | step: 3975/6480 | trn_loss: 27.6575 | val_loss: 26.0099
epoch: 6/951 | step: 3990/6480 | trn_loss: 24.5769 | val_loss: 24.9070
epoch: 6/951 | step: 4005/6480 | trn_loss: 24.9972 | val_loss: 24.6028
epoch: 6/951 | step: 4020/6480 | trn_loss: 24.6235 | val_loss: 25.8570
epoch: 6/951 | step: 4035/6480 | trn_loss: 24.5940 | val_loss: 25.0710
epoch: 6/951 | step: 4050/6480 | trn_loss: 25.1834 | val_loss: 26.6912
epoch: 6/951 | step: 4065/6480 | trn_loss: 24.5909 | val_loss: 25.3294
epoch: 6/951 | step: 4080/6480 | trn_loss: 25.0069 | val_loss: 26.4260
epoch: 6/951 | step: 4095/6480 | trn_loss: 26.0669 | val_loss: 26.3996
epoch:

epoch: 6/951 | step: 5625/6480 | trn_loss: 24.6335 | val_loss: 26.7517
epoch: 6/951 | step: 5640/6480 | trn_loss: 26.3605 | val_loss: 25.0024
epoch: 6/951 | step: 5655/6480 | trn_loss: 25.4634 | val_loss: 24.9183
epoch: 6/951 | step: 5670/6480 | trn_loss: 24.1568 | val_loss: 24.8410
epoch: 6/951 | step: 5685/6480 | trn_loss: 26.1867 | val_loss: 26.9751
epoch: 6/951 | step: 5700/6480 | trn_loss: 24.8904 | val_loss: 27.0972
epoch: 6/951 | step: 5715/6480 | trn_loss: 25.8321 | val_loss: 25.4842
epoch: 6/951 | step: 5730/6480 | trn_loss: 24.4424 | val_loss: 26.5151
epoch: 6/951 | step: 5745/6480 | trn_loss: 25.3144 | val_loss: 26.2434
epoch: 6/951 | step: 5760/6480 | trn_loss: 25.3404 | val_loss: 26.3186
epoch: 6/951 | step: 5775/6480 | trn_loss: 25.0223 | val_loss: 27.8854
epoch: 6/951 | step: 5790/6480 | trn_loss: 25.2806 | val_loss: 27.0023
epoch: 6/951 | step: 5805/6480 | trn_loss: 26.0652 | val_loss: 25.3642
epoch: 6/951 | step: 5820/6480 | trn_loss: 25.6014 | val_loss: 25.6827
epoch:

epoch: 7/951 | step: 885/6480 | trn_loss: 24.2414 | val_loss: 24.2792
epoch: 7/951 | step: 900/6480 | trn_loss: 24.7483 | val_loss: 24.6496
epoch: 7/951 | step: 915/6480 | trn_loss: 25.3410 | val_loss: 28.5853
epoch: 7/951 | step: 930/6480 | trn_loss: 24.4460 | val_loss: 25.9312
epoch: 7/951 | step: 945/6480 | trn_loss: 25.1374 | val_loss: 25.2948
epoch: 7/951 | step: 960/6480 | trn_loss: 25.2962 | val_loss: 26.0130
epoch: 7/951 | step: 975/6480 | trn_loss: 25.8166 | val_loss: 25.7434
epoch: 7/951 | step: 990/6480 | trn_loss: 24.0896 | val_loss: 25.6525
epoch: 7/951 | step: 1005/6480 | trn_loss: 24.5965 | val_loss: 26.3093
epoch: 7/951 | step: 1020/6480 | trn_loss: 24.5996 | val_loss: 26.2954
epoch: 7/951 | step: 1035/6480 | trn_loss: 23.6508 | val_loss: 24.9974
epoch: 7/951 | step: 1050/6480 | trn_loss: 24.2625 | val_loss: 25.6612
epoch: 7/951 | step: 1065/6480 | trn_loss: 24.3614 | val_loss: 24.9477
epoch: 7/951 | step: 1080/6480 | trn_loss: 24.9511 | val_loss: 25.3063
epoch: 7/951 |

epoch: 7/951 | step: 2610/6480 | trn_loss: 24.3593 | val_loss: 25.3370
epoch: 7/951 | step: 2625/6480 | trn_loss: 24.1211 | val_loss: 24.8660
epoch: 7/951 | step: 2640/6480 | trn_loss: 24.9951 | val_loss: 25.1676
epoch: 7/951 | step: 2655/6480 | trn_loss: 24.3200 | val_loss: 26.0222
epoch: 7/951 | step: 2670/6480 | trn_loss: 25.0338 | val_loss: 24.0684
epoch: 7/951 | step: 2685/6480 | trn_loss: 25.0533 | val_loss: 25.3971
epoch: 7/951 | step: 2700/6480 | trn_loss: 24.9144 | val_loss: 26.4239
epoch: 7/951 | step: 2715/6480 | trn_loss: 24.2842 | val_loss: 25.1453
epoch: 7/951 | step: 2730/6480 | trn_loss: 24.2246 | val_loss: 25.1932
epoch: 7/951 | step: 2745/6480 | trn_loss: 24.3450 | val_loss: 26.5113
epoch: 7/951 | step: 2760/6480 | trn_loss: 26.4419 | val_loss: 25.7664
epoch: 7/951 | step: 2775/6480 | trn_loss: 24.4514 | val_loss: 25.1974
epoch: 7/951 | step: 2790/6480 | trn_loss: 23.4924 | val_loss: 25.2536
epoch: 7/951 | step: 2805/6480 | trn_loss: 25.6546 | val_loss: 26.5960
epoch:

epoch: 7/951 | step: 4335/6480 | trn_loss: 24.5878 | val_loss: 24.5046
epoch: 7/951 | step: 4350/6480 | trn_loss: 23.7232 | val_loss: 24.8941
epoch: 7/951 | step: 4365/6480 | trn_loss: 23.9261 | val_loss: 24.8708
epoch: 7/951 | step: 4380/6480 | trn_loss: 24.4506 | val_loss: 26.4741
epoch: 7/951 | step: 4395/6480 | trn_loss: 25.6126 | val_loss: 27.5468
epoch: 7/951 | step: 4410/6480 | trn_loss: 25.0824 | val_loss: 24.9197
epoch: 7/951 | step: 4425/6480 | trn_loss: 24.2851 | val_loss: 25.8964
epoch: 7/951 | step: 4440/6480 | trn_loss: 23.9831 | val_loss: 25.0665
epoch: 7/951 | step: 4455/6480 | trn_loss: 25.4161 | val_loss: 24.8618
epoch: 7/951 | step: 4470/6480 | trn_loss: 25.7181 | val_loss: 25.3011
epoch: 7/951 | step: 4485/6480 | trn_loss: 24.2928 | val_loss: 26.9224
epoch: 7/951 | step: 4500/6480 | trn_loss: 23.7928 | val_loss: 25.1224
epoch: 7/951 | step: 4515/6480 | trn_loss: 25.2363 | val_loss: 25.7192
epoch: 7/951 | step: 4530/6480 | trn_loss: 24.8468 | val_loss: 26.5097
epoch:

epoch: 7/951 | step: 6060/6480 | trn_loss: 24.0082 | val_loss: 26.6112
epoch: 7/951 | step: 6075/6480 | trn_loss: 24.7239 | val_loss: 25.4628
epoch: 7/951 | step: 6090/6480 | trn_loss: 24.2150 | val_loss: 25.3204
epoch: 7/951 | step: 6105/6480 | trn_loss: 24.5615 | val_loss: 25.3195
epoch: 7/951 | step: 6120/6480 | trn_loss: 24.8838 | val_loss: 24.9741
epoch: 7/951 | step: 6135/6480 | trn_loss: 24.5092 | val_loss: 25.6646
epoch: 7/951 | step: 6150/6480 | trn_loss: 24.6097 | val_loss: 25.5163
epoch: 7/951 | step: 6165/6480 | trn_loss: 24.0960 | val_loss: 24.5558
epoch: 7/951 | step: 6180/6480 | trn_loss: 23.9714 | val_loss: 25.5870
epoch: 7/951 | step: 6195/6480 | trn_loss: 24.7642 | val_loss: 25.6601
epoch: 7/951 | step: 6210/6480 | trn_loss: 25.1143 | val_loss: 27.4986
epoch: 7/951 | step: 6225/6480 | trn_loss: 24.6484 | val_loss: 28.9890
epoch: 7/951 | step: 6240/6480 | trn_loss: 24.6059 | val_loss: 25.0611
epoch: 7/951 | step: 6255/6480 | trn_loss: 24.1933 | val_loss: 25.4742
epoch:

epoch: 8/951 | step: 1320/6480 | trn_loss: 25.2401 | val_loss: 25.7649
epoch: 8/951 | step: 1335/6480 | trn_loss: 23.8445 | val_loss: 24.7358
epoch: 8/951 | step: 1350/6480 | trn_loss: 24.7493 | val_loss: 25.4345
epoch: 8/951 | step: 1365/6480 | trn_loss: 23.4551 | val_loss: 23.9769
epoch: 8/951 | step: 1380/6480 | trn_loss: 24.2525 | val_loss: 24.5251
epoch: 8/951 | step: 1395/6480 | trn_loss: 23.9875 | val_loss: 24.4775
epoch: 8/951 | step: 1410/6480 | trn_loss: 24.4506 | val_loss: 25.1580
epoch: 8/951 | step: 1425/6480 | trn_loss: 24.1103 | val_loss: 25.1839
epoch: 8/951 | step: 1440/6480 | trn_loss: 23.9729 | val_loss: 24.6594
epoch: 8/951 | step: 1455/6480 | trn_loss: 23.4964 | val_loss: 24.0759
epoch: 8/951 | step: 1470/6480 | trn_loss: 24.1544 | val_loss: 24.4928
epoch: 8/951 | step: 1485/6480 | trn_loss: 24.9953 | val_loss: 26.8399
epoch: 8/951 | step: 1500/6480 | trn_loss: 24.6334 | val_loss: 26.6592
epoch: 8/951 | step: 1515/6480 | trn_loss: 23.9359 | val_loss: 25.7178
epoch:

epoch: 8/951 | step: 3045/6480 | trn_loss: 24.0995 | val_loss: 23.9667
epoch: 8/951 | step: 3060/6480 | trn_loss: 23.8003 | val_loss: 24.4715
epoch: 8/951 | step: 3075/6480 | trn_loss: 25.0528 | val_loss: 23.8195
epoch: 8/951 | step: 3090/6480 | trn_loss: 23.5501 | val_loss: 24.2335
epoch: 8/951 | step: 3105/6480 | trn_loss: 24.2569 | val_loss: 25.2210
epoch: 8/951 | step: 3120/6480 | trn_loss: 23.8398 | val_loss: 23.9274
epoch: 8/951 | step: 3135/6480 | trn_loss: 23.2214 | val_loss: 24.5879
epoch: 8/951 | step: 3150/6480 | trn_loss: 23.7257 | val_loss: 26.5652
epoch: 8/951 | step: 3165/6480 | trn_loss: 24.7783 | val_loss: 24.7565
epoch: 8/951 | step: 3180/6480 | trn_loss: 25.0039 | val_loss: 25.2953
epoch: 8/951 | step: 3195/6480 | trn_loss: 24.3573 | val_loss: 24.5968
epoch: 8/951 | step: 3210/6480 | trn_loss: 24.3104 | val_loss: 25.8983
epoch: 8/951 | step: 3225/6480 | trn_loss: 24.2355 | val_loss: 24.6773
epoch: 8/951 | step: 3240/6480 | trn_loss: 24.1484 | val_loss: 24.8934
epoch:

epoch: 8/951 | step: 4770/6480 | trn_loss: 25.4254 | val_loss: 24.5353
epoch: 8/951 | step: 4785/6480 | trn_loss: 25.0537 | val_loss: 25.3181
epoch: 8/951 | step: 4800/6480 | trn_loss: 24.1454 | val_loss: 23.5535
epoch: 8/951 | step: 4815/6480 | trn_loss: 23.3725 | val_loss: 24.5617
epoch: 8/951 | step: 4830/6480 | trn_loss: 24.6059 | val_loss: 24.4472
epoch: 8/951 | step: 4845/6480 | trn_loss: 23.2079 | val_loss: 24.3244
epoch: 8/951 | step: 4860/6480 | trn_loss: 23.4941 | val_loss: 24.6005
epoch: 8/951 | step: 4875/6480 | trn_loss: 24.8107 | val_loss: 24.8343
epoch: 8/951 | step: 4890/6480 | trn_loss: 25.2411 | val_loss: 24.8880
epoch: 8/951 | step: 4905/6480 | trn_loss: 24.6740 | val_loss: 24.6576
epoch: 8/951 | step: 4920/6480 | trn_loss: 24.7845 | val_loss: 26.3069
epoch: 8/951 | step: 4935/6480 | trn_loss: 24.7947 | val_loss: 25.5105
epoch: 8/951 | step: 4950/6480 | trn_loss: 24.9256 | val_loss: 25.6910
epoch: 8/951 | step: 4965/6480 | trn_loss: 24.8374 | val_loss: 26.7366
epoch:

epoch: 9/951 | step: 15/6480 | trn_loss: 24.1475 | val_loss: 25.5175
epoch: 9/951 | step: 30/6480 | trn_loss: 23.6405 | val_loss: 25.5210
epoch: 9/951 | step: 45/6480 | trn_loss: 24.3041 | val_loss: 26.0822
epoch: 9/951 | step: 60/6480 | trn_loss: 24.3409 | val_loss: 24.4820
epoch: 9/951 | step: 75/6480 | trn_loss: 23.1736 | val_loss: 28.5773
epoch: 9/951 | step: 90/6480 | trn_loss: 24.6104 | val_loss: 23.9646
epoch: 9/951 | step: 105/6480 | trn_loss: 22.6694 | val_loss: 24.7293
epoch: 9/951 | step: 120/6480 | trn_loss: 23.7100 | val_loss: 25.4111
epoch: 9/951 | step: 135/6480 | trn_loss: 23.6980 | val_loss: 24.9083
epoch: 9/951 | step: 150/6480 | trn_loss: 23.6591 | val_loss: 24.6001
epoch: 9/951 | step: 165/6480 | trn_loss: 23.3625 | val_loss: 24.2236
epoch: 9/951 | step: 180/6480 | trn_loss: 23.2796 | val_loss: 26.1910
epoch: 9/951 | step: 195/6480 | trn_loss: 24.0143 | val_loss: 25.9337
epoch: 9/951 | step: 210/6480 | trn_loss: 23.5433 | val_loss: 23.8147
epoch: 9/951 | step: 225/6

epoch: 9/951 | step: 1755/6480 | trn_loss: 23.4468 | val_loss: 25.2225
epoch: 9/951 | step: 1770/6480 | trn_loss: 23.9119 | val_loss: 24.0344
epoch: 9/951 | step: 1785/6480 | trn_loss: 23.3762 | val_loss: 24.1725
epoch: 9/951 | step: 1800/6480 | trn_loss: 24.3231 | val_loss: 24.4916
epoch: 9/951 | step: 1815/6480 | trn_loss: 25.4551 | val_loss: 25.3048
epoch: 9/951 | step: 1830/6480 | trn_loss: 23.2838 | val_loss: 24.6115
epoch: 9/951 | step: 1845/6480 | trn_loss: 24.3525 | val_loss: 23.4238
epoch: 9/951 | step: 1860/6480 | trn_loss: 23.5179 | val_loss: 24.8217
epoch: 9/951 | step: 1875/6480 | trn_loss: 23.7323 | val_loss: 25.5795
epoch: 9/951 | step: 1890/6480 | trn_loss: 24.4801 | val_loss: 25.1600
epoch: 9/951 | step: 1905/6480 | trn_loss: 23.9527 | val_loss: 25.4000
epoch: 9/951 | step: 1920/6480 | trn_loss: 24.1222 | val_loss: 24.6504
epoch: 9/951 | step: 1935/6480 | trn_loss: 23.3995 | val_loss: 24.6429
epoch: 9/951 | step: 1950/6480 | trn_loss: 23.6096 | val_loss: 24.4090
epoch:

epoch: 9/951 | step: 3480/6480 | trn_loss: 24.3255 | val_loss: 26.7611
epoch: 9/951 | step: 3495/6480 | trn_loss: 23.0413 | val_loss: 24.8327
epoch: 9/951 | step: 3510/6480 | trn_loss: 23.8160 | val_loss: 24.2173
epoch: 9/951 | step: 3525/6480 | trn_loss: 23.8704 | val_loss: 23.8849
epoch: 9/951 | step: 3540/6480 | trn_loss: 23.4361 | val_loss: 24.4073
epoch: 9/951 | step: 3555/6480 | trn_loss: 24.0593 | val_loss: 24.6358
epoch: 9/951 | step: 3570/6480 | trn_loss: 24.1483 | val_loss: 24.6808
epoch: 9/951 | step: 3585/6480 | trn_loss: 24.2363 | val_loss: 24.2883
epoch: 9/951 | step: 3600/6480 | trn_loss: 23.9688 | val_loss: 24.5021
epoch: 9/951 | step: 3615/6480 | trn_loss: 24.2502 | val_loss: 24.3856
epoch: 9/951 | step: 3630/6480 | trn_loss: 24.4861 | val_loss: 24.7929
epoch: 9/951 | step: 3645/6480 | trn_loss: 23.2136 | val_loss: 24.5190
epoch: 9/951 | step: 3660/6480 | trn_loss: 23.0166 | val_loss: 24.4621
epoch: 9/951 | step: 3675/6480 | trn_loss: 23.3399 | val_loss: 23.9690
epoch:

epoch: 9/951 | step: 5205/6480 | trn_loss: 24.3214 | val_loss: 24.4320
epoch: 9/951 | step: 5220/6480 | trn_loss: 23.1949 | val_loss: 24.3836
epoch: 9/951 | step: 5235/6480 | trn_loss: 24.1552 | val_loss: 24.7210
epoch: 9/951 | step: 5250/6480 | trn_loss: 23.9889 | val_loss: 25.3744
epoch: 9/951 | step: 5265/6480 | trn_loss: 23.6749 | val_loss: 23.5887
epoch: 9/951 | step: 5280/6480 | trn_loss: 24.1037 | val_loss: 24.1132
epoch: 9/951 | step: 5295/6480 | trn_loss: 25.0766 | val_loss: 24.6482
epoch: 9/951 | step: 5310/6480 | trn_loss: 22.9561 | val_loss: 24.6086
epoch: 9/951 | step: 5325/6480 | trn_loss: 24.6014 | val_loss: 25.7326
epoch: 9/951 | step: 5340/6480 | trn_loss: 23.9345 | val_loss: 24.0451
epoch: 9/951 | step: 5355/6480 | trn_loss: 23.0154 | val_loss: 27.5189
epoch: 9/951 | step: 5370/6480 | trn_loss: 23.7114 | val_loss: 24.6548
epoch: 9/951 | step: 5385/6480 | trn_loss: 23.6766 | val_loss: 24.5513
epoch: 9/951 | step: 5400/6480 | trn_loss: 24.2112 | val_loss: 25.9821
epoch:

epoch: 10/951 | step: 450/6480 | trn_loss: 23.6184 | val_loss: 24.5281
epoch: 10/951 | step: 465/6480 | trn_loss: 23.4558 | val_loss: 24.9482
epoch: 10/951 | step: 480/6480 | trn_loss: 24.3186 | val_loss: 23.8612
epoch: 10/951 | step: 495/6480 | trn_loss: 23.0470 | val_loss: 24.5940
epoch: 10/951 | step: 510/6480 | trn_loss: 23.8778 | val_loss: 24.7196
epoch: 10/951 | step: 525/6480 | trn_loss: 23.5040 | val_loss: 26.0440
epoch: 10/951 | step: 540/6480 | trn_loss: 24.2900 | val_loss: 24.0645
epoch: 10/951 | step: 555/6480 | trn_loss: 25.2417 | val_loss: 24.7356
epoch: 10/951 | step: 570/6480 | trn_loss: 24.5089 | val_loss: 24.7561
epoch: 10/951 | step: 585/6480 | trn_loss: 23.5637 | val_loss: 22.8040
epoch: 10/951 | step: 600/6480 | trn_loss: 24.1698 | val_loss: 23.6954
epoch: 10/951 | step: 615/6480 | trn_loss: 23.6748 | val_loss: 24.9439
epoch: 10/951 | step: 630/6480 | trn_loss: 24.0773 | val_loss: 24.2444
epoch: 10/951 | step: 645/6480 | trn_loss: 23.8588 | val_loss: 23.9437
epoch:

epoch: 10/951 | step: 2160/6480 | trn_loss: 22.5845 | val_loss: 24.7134
epoch: 10/951 | step: 2175/6480 | trn_loss: 23.7368 | val_loss: 25.4851
epoch: 10/951 | step: 2190/6480 | trn_loss: 23.8292 | val_loss: 24.0213
epoch: 10/951 | step: 2205/6480 | trn_loss: 24.4686 | val_loss: 24.5453
epoch: 10/951 | step: 2220/6480 | trn_loss: 24.0988 | val_loss: 23.7754
epoch: 10/951 | step: 2235/6480 | trn_loss: 23.7555 | val_loss: 23.4114
epoch: 10/951 | step: 2250/6480 | trn_loss: 23.9770 | val_loss: 24.7678
epoch: 10/951 | step: 2265/6480 | trn_loss: 25.0461 | val_loss: 24.8759
epoch: 10/951 | step: 2280/6480 | trn_loss: 23.7755 | val_loss: 24.8299
epoch: 10/951 | step: 2295/6480 | trn_loss: 24.4626 | val_loss: 24.6865
epoch: 10/951 | step: 2310/6480 | trn_loss: 24.0894 | val_loss: 23.6983
epoch: 10/951 | step: 2325/6480 | trn_loss: 23.1166 | val_loss: 24.2136
epoch: 10/951 | step: 2340/6480 | trn_loss: 23.4886 | val_loss: 24.2830
epoch: 10/951 | step: 2355/6480 | trn_loss: 22.9794 | val_loss: 

epoch: 10/951 | step: 3855/6480 | trn_loss: 23.9402 | val_loss: 23.6436
epoch: 10/951 | step: 3870/6480 | trn_loss: 24.4865 | val_loss: 24.0944
epoch: 10/951 | step: 3885/6480 | trn_loss: 24.0824 | val_loss: 24.1945
epoch: 10/951 | step: 3900/6480 | trn_loss: 23.7832 | val_loss: 24.0267
epoch: 10/951 | step: 3915/6480 | trn_loss: 22.7411 | val_loss: 23.4186
epoch: 10/951 | step: 3930/6480 | trn_loss: 23.4212 | val_loss: 24.3057
epoch: 10/951 | step: 3945/6480 | trn_loss: 23.3376 | val_loss: 23.8740
epoch: 10/951 | step: 3960/6480 | trn_loss: 22.8710 | val_loss: 24.5321
epoch: 10/951 | step: 3975/6480 | trn_loss: 24.0087 | val_loss: 24.3868
epoch: 10/951 | step: 3990/6480 | trn_loss: 23.8625 | val_loss: 23.4096
epoch: 10/951 | step: 4005/6480 | trn_loss: 23.4151 | val_loss: 24.8228
epoch: 10/951 | step: 4020/6480 | trn_loss: 24.0757 | val_loss: 25.0529
epoch: 10/951 | step: 4035/6480 | trn_loss: 24.0868 | val_loss: 25.5531
epoch: 10/951 | step: 4050/6480 | trn_loss: 23.4347 | val_loss: 

epoch: 10/951 | step: 5550/6480 | trn_loss: 23.2395 | val_loss: 25.0178
epoch: 10/951 | step: 5565/6480 | trn_loss: 23.6550 | val_loss: 24.1288
epoch: 10/951 | step: 5580/6480 | trn_loss: 22.4621 | val_loss: 22.9634
epoch: 10/951 | step: 5595/6480 | trn_loss: 22.8784 | val_loss: 23.9350
epoch: 10/951 | step: 5610/6480 | trn_loss: 24.0439 | val_loss: 23.6618
epoch: 10/951 | step: 5625/6480 | trn_loss: 23.3159 | val_loss: 24.0089
epoch: 10/951 | step: 5640/6480 | trn_loss: 23.2489 | val_loss: 24.8362
epoch: 10/951 | step: 5655/6480 | trn_loss: 23.3661 | val_loss: 23.1713
epoch: 10/951 | step: 5670/6480 | trn_loss: 23.2977 | val_loss: 24.4303
epoch: 10/951 | step: 5685/6480 | trn_loss: 23.1646 | val_loss: 24.1526
epoch: 10/951 | step: 5700/6480 | trn_loss: 23.4177 | val_loss: 24.6285
epoch: 10/951 | step: 5715/6480 | trn_loss: 23.7223 | val_loss: 24.3690
epoch: 10/951 | step: 5730/6480 | trn_loss: 24.9851 | val_loss: 24.4795
epoch: 10/951 | step: 5745/6480 | trn_loss: 25.5432 | val_loss: 

epoch: 11/951 | step: 780/6480 | trn_loss: 22.8190 | val_loss: 24.4610
epoch: 11/951 | step: 795/6480 | trn_loss: 23.0577 | val_loss: 24.5164
epoch: 11/951 | step: 810/6480 | trn_loss: 23.2772 | val_loss: 23.9383
epoch: 11/951 | step: 825/6480 | trn_loss: 23.0760 | val_loss: 25.0284
epoch: 11/951 | step: 840/6480 | trn_loss: 23.4198 | val_loss: 24.7849
epoch: 11/951 | step: 855/6480 | trn_loss: 23.4265 | val_loss: 24.3920
epoch: 11/951 | step: 870/6480 | trn_loss: 24.0365 | val_loss: 25.9704
epoch: 11/951 | step: 885/6480 | trn_loss: 23.5144 | val_loss: 24.6880
epoch: 11/951 | step: 900/6480 | trn_loss: 23.4040 | val_loss: 23.8665
epoch: 11/951 | step: 915/6480 | trn_loss: 23.7932 | val_loss: 23.5356
epoch: 11/951 | step: 930/6480 | trn_loss: 23.2126 | val_loss: 23.2904
epoch: 11/951 | step: 945/6480 | trn_loss: 23.4343 | val_loss: 24.3790
epoch: 11/951 | step: 960/6480 | trn_loss: 22.9443 | val_loss: 24.2804
epoch: 11/951 | step: 975/6480 | trn_loss: 23.6564 | val_loss: 25.2410
epoch:

epoch: 11/951 | step: 2490/6480 | trn_loss: 23.3258 | val_loss: 23.5021
epoch: 11/951 | step: 2505/6480 | trn_loss: 22.6841 | val_loss: 23.4590
epoch: 11/951 | step: 2520/6480 | trn_loss: 22.9954 | val_loss: 23.6675
epoch: 11/951 | step: 2535/6480 | trn_loss: 24.3952 | val_loss: 24.7815
epoch: 11/951 | step: 2550/6480 | trn_loss: 23.5318 | val_loss: 23.7408
epoch: 11/951 | step: 2565/6480 | trn_loss: 23.3379 | val_loss: 24.6209
epoch: 11/951 | step: 2580/6480 | trn_loss: 23.1914 | val_loss: 23.5361
epoch: 11/951 | step: 2595/6480 | trn_loss: 22.7791 | val_loss: 25.0826
epoch: 11/951 | step: 2610/6480 | trn_loss: 22.6556 | val_loss: 24.8534
epoch: 11/951 | step: 2625/6480 | trn_loss: 23.1499 | val_loss: 24.4020
epoch: 11/951 | step: 2640/6480 | trn_loss: 24.8067 | val_loss: 24.0242
epoch: 11/951 | step: 2655/6480 | trn_loss: 23.8921 | val_loss: 24.0202
epoch: 11/951 | step: 2670/6480 | trn_loss: 23.2803 | val_loss: 23.5942
epoch: 11/951 | step: 2685/6480 | trn_loss: 23.2659 | val_loss: 

epoch: 11/951 | step: 4185/6480 | trn_loss: 24.2839 | val_loss: 24.9434
epoch: 11/951 | step: 4200/6480 | trn_loss: 23.1193 | val_loss: 23.8841
epoch: 11/951 | step: 4215/6480 | trn_loss: 23.6275 | val_loss: 23.9609
epoch: 11/951 | step: 4230/6480 | trn_loss: 22.6572 | val_loss: 25.2086
epoch: 11/951 | step: 4245/6480 | trn_loss: 24.2018 | val_loss: 23.8210
epoch: 11/951 | step: 4260/6480 | trn_loss: 23.7027 | val_loss: 23.2297
epoch: 11/951 | step: 4275/6480 | trn_loss: 22.8594 | val_loss: 25.0364
epoch: 11/951 | step: 4290/6480 | trn_loss: 23.7212 | val_loss: 23.9320
epoch: 11/951 | step: 4305/6480 | trn_loss: 22.2106 | val_loss: 22.9281
epoch: 11/951 | step: 4320/6480 | trn_loss: 23.5058 | val_loss: 23.6272
epoch: 11/951 | step: 4335/6480 | trn_loss: 23.3179 | val_loss: 25.0572
epoch: 11/951 | step: 4350/6480 | trn_loss: 23.2481 | val_loss: 24.0119
epoch: 11/951 | step: 4365/6480 | trn_loss: 22.7864 | val_loss: 23.6321
epoch: 11/951 | step: 4380/6480 | trn_loss: 22.2206 | val_loss: 

epoch: 11/951 | step: 5880/6480 | trn_loss: 23.0356 | val_loss: 24.2605
epoch: 11/951 | step: 5895/6480 | trn_loss: 24.2150 | val_loss: 24.4057
epoch: 11/951 | step: 5910/6480 | trn_loss: 23.8022 | val_loss: 24.1860
epoch: 11/951 | step: 5925/6480 | trn_loss: 22.9944 | val_loss: 24.6051
epoch: 11/951 | step: 5940/6480 | trn_loss: 23.2436 | val_loss: 24.8929
epoch: 11/951 | step: 5955/6480 | trn_loss: 23.7268 | val_loss: 26.0823
epoch: 11/951 | step: 5970/6480 | trn_loss: 23.4986 | val_loss: 25.4039
epoch: 11/951 | step: 5985/6480 | trn_loss: 22.7428 | val_loss: 24.0963
epoch: 11/951 | step: 6000/6480 | trn_loss: 23.2718 | val_loss: 24.1580
epoch: 11/951 | step: 6015/6480 | trn_loss: 22.8869 | val_loss: 22.8999
epoch: 11/951 | step: 6030/6480 | trn_loss: 23.2237 | val_loss: 25.5330
epoch: 11/951 | step: 6045/6480 | trn_loss: 23.7915 | val_loss: 24.1669
epoch: 11/951 | step: 6060/6480 | trn_loss: 23.2142 | val_loss: 25.4848
epoch: 11/951 | step: 6075/6480 | trn_loss: 23.4393 | val_loss: 

epoch: 12/951 | step: 1110/6480 | trn_loss: 23.5524 | val_loss: 24.2441
epoch: 12/951 | step: 1125/6480 | trn_loss: 23.5226 | val_loss: 24.3683
epoch: 12/951 | step: 1140/6480 | trn_loss: 22.3008 | val_loss: 23.9386
epoch: 12/951 | step: 1155/6480 | trn_loss: 23.6271 | val_loss: 24.1465
epoch: 12/951 | step: 1170/6480 | trn_loss: 23.2882 | val_loss: 22.9403
epoch: 12/951 | step: 1185/6480 | trn_loss: 22.6764 | val_loss: 23.4440
epoch: 12/951 | step: 1200/6480 | trn_loss: 23.5188 | val_loss: 25.4774
epoch: 12/951 | step: 1215/6480 | trn_loss: 22.9721 | val_loss: 23.9708
epoch: 12/951 | step: 1230/6480 | trn_loss: 22.8338 | val_loss: 24.2883
epoch: 12/951 | step: 1245/6480 | trn_loss: 23.6569 | val_loss: 26.6090
epoch: 12/951 | step: 1260/6480 | trn_loss: 23.4126 | val_loss: 24.0435
epoch: 12/951 | step: 1275/6480 | trn_loss: 23.0613 | val_loss: 23.5223
epoch: 12/951 | step: 1290/6480 | trn_loss: 23.1369 | val_loss: 24.2207
epoch: 12/951 | step: 1305/6480 | trn_loss: 23.0460 | val_loss: 

epoch: 12/951 | step: 2805/6480 | trn_loss: 24.2919 | val_loss: 24.6038
epoch: 12/951 | step: 2820/6480 | trn_loss: 23.9833 | val_loss: 24.2533
epoch: 12/951 | step: 2835/6480 | trn_loss: 23.6984 | val_loss: 23.4392
epoch: 12/951 | step: 2850/6480 | trn_loss: 24.3140 | val_loss: 23.6577
epoch: 12/951 | step: 2865/6480 | trn_loss: 23.0811 | val_loss: 23.1466
epoch: 12/951 | step: 2880/6480 | trn_loss: 22.6654 | val_loss: 23.2824
epoch: 12/951 | step: 2895/6480 | trn_loss: 23.0759 | val_loss: 25.4655
epoch: 12/951 | step: 2910/6480 | trn_loss: 23.3972 | val_loss: 24.1165
epoch: 12/951 | step: 2925/6480 | trn_loss: 24.5335 | val_loss: 23.3697
epoch: 12/951 | step: 2940/6480 | trn_loss: 23.7364 | val_loss: 24.6653
epoch: 12/951 | step: 2955/6480 | trn_loss: 23.0528 | val_loss: 23.4594
epoch: 12/951 | step: 2970/6480 | trn_loss: 23.7089 | val_loss: 24.3196
epoch: 12/951 | step: 2985/6480 | trn_loss: 22.5322 | val_loss: 23.4622
epoch: 12/951 | step: 3000/6480 | trn_loss: 23.5241 | val_loss: 

epoch: 12/951 | step: 4500/6480 | trn_loss: 23.0589 | val_loss: 22.7651
epoch: 12/951 | step: 4515/6480 | trn_loss: 22.4785 | val_loss: 25.4028
epoch: 12/951 | step: 4530/6480 | trn_loss: 23.7291 | val_loss: 23.8604
epoch: 12/951 | step: 4545/6480 | trn_loss: 23.2547 | val_loss: 23.4425
epoch: 12/951 | step: 4560/6480 | trn_loss: 23.1073 | val_loss: 24.3392
epoch: 12/951 | step: 4575/6480 | trn_loss: 23.3397 | val_loss: 23.9398
epoch: 12/951 | step: 4590/6480 | trn_loss: 24.2685 | val_loss: 23.0716
epoch: 12/951 | step: 4605/6480 | trn_loss: 22.6622 | val_loss: 23.7056
epoch: 12/951 | step: 4620/6480 | trn_loss: 23.4708 | val_loss: 23.4317
epoch: 12/951 | step: 4635/6480 | trn_loss: 23.3325 | val_loss: 24.8374
epoch: 12/951 | step: 4650/6480 | trn_loss: 23.6239 | val_loss: 23.1244
epoch: 12/951 | step: 4665/6480 | trn_loss: 23.6733 | val_loss: 24.4167
epoch: 12/951 | step: 4680/6480 | trn_loss: 22.6665 | val_loss: 23.3308
epoch: 12/951 | step: 4695/6480 | trn_loss: 23.0576 | val_loss: 

epoch: 12/951 | step: 6195/6480 | trn_loss: 23.6114 | val_loss: 24.9245
epoch: 12/951 | step: 6210/6480 | trn_loss: 22.7117 | val_loss: 23.8721
epoch: 12/951 | step: 6225/6480 | trn_loss: 23.1294 | val_loss: 23.6374
epoch: 12/951 | step: 6240/6480 | trn_loss: 23.0573 | val_loss: 22.7790
epoch: 12/951 | step: 6255/6480 | trn_loss: 22.7593 | val_loss: 24.3659
epoch: 12/951 | step: 6270/6480 | trn_loss: 24.3300 | val_loss: 25.0459
epoch: 12/951 | step: 6285/6480 | trn_loss: 22.8012 | val_loss: 23.4089
epoch: 12/951 | step: 6300/6480 | trn_loss: 23.1110 | val_loss: 24.9187
epoch: 12/951 | step: 6315/6480 | trn_loss: 24.2852 | val_loss: 25.3055
epoch: 12/951 | step: 6330/6480 | trn_loss: 23.8652 | val_loss: 24.2435
epoch: 12/951 | step: 6345/6480 | trn_loss: 24.1600 | val_loss: 23.6275
epoch: 12/951 | step: 6360/6480 | trn_loss: 23.0285 | val_loss: 23.4502
epoch: 12/951 | step: 6375/6480 | trn_loss: 22.8515 | val_loss: 23.4859
epoch: 12/951 | step: 6390/6480 | trn_loss: 23.4057 | val_loss: 

epoch: 13/951 | step: 1425/6480 | trn_loss: 23.5204 | val_loss: 23.6397
epoch: 13/951 | step: 1440/6480 | trn_loss: 22.3966 | val_loss: 24.3178
epoch: 13/951 | step: 1455/6480 | trn_loss: 24.4837 | val_loss: 23.4928
epoch: 13/951 | step: 1470/6480 | trn_loss: 22.9518 | val_loss: 24.0308
epoch: 13/951 | step: 1485/6480 | trn_loss: 22.6336 | val_loss: 24.2767
epoch: 13/951 | step: 1500/6480 | trn_loss: 23.5816 | val_loss: 24.1968
epoch: 13/951 | step: 1515/6480 | trn_loss: 23.5277 | val_loss: 24.4499
epoch: 13/951 | step: 1530/6480 | trn_loss: 22.9496 | val_loss: 24.2152
epoch: 13/951 | step: 1545/6480 | trn_loss: 23.1526 | val_loss: 22.7366
epoch: 13/951 | step: 1560/6480 | trn_loss: 22.6780 | val_loss: 22.8695
epoch: 13/951 | step: 1575/6480 | trn_loss: 22.7012 | val_loss: 23.3967
epoch: 13/951 | step: 1590/6480 | trn_loss: 23.4497 | val_loss: 24.5058
epoch: 13/951 | step: 1605/6480 | trn_loss: 22.4786 | val_loss: 25.4490
epoch: 13/951 | step: 1620/6480 | trn_loss: 22.4052 | val_loss: 

epoch: 13/951 | step: 3120/6480 | trn_loss: 21.9124 | val_loss: 23.9819
epoch: 13/951 | step: 3135/6480 | trn_loss: 23.7348 | val_loss: 24.1201
epoch: 13/951 | step: 3150/6480 | trn_loss: 23.0950 | val_loss: 23.6634
epoch: 13/951 | step: 3165/6480 | trn_loss: 22.7334 | val_loss: 23.5272
epoch: 13/951 | step: 3180/6480 | trn_loss: 22.4934 | val_loss: 25.3431
epoch: 13/951 | step: 3195/6480 | trn_loss: 23.0362 | val_loss: 23.6360
epoch: 13/951 | step: 3210/6480 | trn_loss: 23.3807 | val_loss: 24.4628
epoch: 13/951 | step: 3225/6480 | trn_loss: 23.0230 | val_loss: 23.8596
epoch: 13/951 | step: 3240/6480 | trn_loss: 22.9933 | val_loss: 23.4197
epoch: 13/951 | step: 3255/6480 | trn_loss: 23.4179 | val_loss: 23.3897
epoch: 13/951 | step: 3270/6480 | trn_loss: 22.4545 | val_loss: 23.6119
epoch: 13/951 | step: 3285/6480 | trn_loss: 23.0625 | val_loss: 24.8095
epoch: 13/951 | step: 3300/6480 | trn_loss: 22.2294 | val_loss: 23.0794
epoch: 13/951 | step: 3315/6480 | trn_loss: 22.8059 | val_loss: 

epoch: 13/951 | step: 4815/6480 | trn_loss: 22.9103 | val_loss: 24.6254
epoch: 13/951 | step: 4830/6480 | trn_loss: 23.1230 | val_loss: 23.0400
epoch: 13/951 | step: 4845/6480 | trn_loss: 22.8251 | val_loss: 26.5011
epoch: 13/951 | step: 4860/6480 | trn_loss: 22.2417 | val_loss: 23.2288
epoch: 13/951 | step: 4875/6480 | trn_loss: 22.4468 | val_loss: 24.2764
epoch: 13/951 | step: 4890/6480 | trn_loss: 23.4067 | val_loss: 23.6134
epoch: 13/951 | step: 4905/6480 | trn_loss: 21.8322 | val_loss: 22.2073
epoch: 13/951 | step: 4920/6480 | trn_loss: 21.5164 | val_loss: 22.6882
epoch: 13/951 | step: 4935/6480 | trn_loss: 22.3858 | val_loss: 25.2584
epoch: 13/951 | step: 4950/6480 | trn_loss: 23.6997 | val_loss: 25.2339
epoch: 13/951 | step: 4965/6480 | trn_loss: 23.0338 | val_loss: 26.5270
epoch: 13/951 | step: 4980/6480 | trn_loss: 22.8722 | val_loss: 22.7179
epoch: 13/951 | step: 4995/6480 | trn_loss: 22.2787 | val_loss: 23.0928
epoch: 13/951 | step: 5010/6480 | trn_loss: 23.8281 | val_loss: 

epoch: 14/951 | step: 30/6480 | trn_loss: 22.6304 | val_loss: 23.3377
epoch: 14/951 | step: 45/6480 | trn_loss: 23.3574 | val_loss: 23.4223
epoch: 14/951 | step: 60/6480 | trn_loss: 22.8968 | val_loss: 22.8911
epoch: 14/951 | step: 75/6480 | trn_loss: 22.7422 | val_loss: 23.4114
epoch: 14/951 | step: 90/6480 | trn_loss: 23.1898 | val_loss: 24.7706
epoch: 14/951 | step: 105/6480 | trn_loss: 24.2394 | val_loss: 23.9801
epoch: 14/951 | step: 120/6480 | trn_loss: 22.4226 | val_loss: 24.2634
epoch: 14/951 | step: 135/6480 | trn_loss: 23.0756 | val_loss: 23.7999
epoch: 14/951 | step: 150/6480 | trn_loss: 22.9346 | val_loss: 23.0721
epoch: 14/951 | step: 165/6480 | trn_loss: 22.5995 | val_loss: 22.9498
epoch: 14/951 | step: 180/6480 | trn_loss: 22.0075 | val_loss: 23.0983
epoch: 14/951 | step: 195/6480 | trn_loss: 22.7063 | val_loss: 23.0831
epoch: 14/951 | step: 210/6480 | trn_loss: 22.9461 | val_loss: 23.6185
epoch: 14/951 | step: 225/6480 | trn_loss: 22.1051 | val_loss: 23.0713
epoch: 14/9

epoch: 14/951 | step: 1740/6480 | trn_loss: 22.5221 | val_loss: 23.8424
epoch: 14/951 | step: 1755/6480 | trn_loss: 22.2792 | val_loss: 23.9248
epoch: 14/951 | step: 1770/6480 | trn_loss: 22.8220 | val_loss: 23.0551
epoch: 14/951 | step: 1785/6480 | trn_loss: 22.0592 | val_loss: 23.3426
epoch: 14/951 | step: 1800/6480 | trn_loss: 23.4462 | val_loss: 23.4677
epoch: 14/951 | step: 1815/6480 | trn_loss: 22.3412 | val_loss: 22.7872
epoch: 14/951 | step: 1830/6480 | trn_loss: 22.4662 | val_loss: 23.2066
epoch: 14/951 | step: 1845/6480 | trn_loss: 22.5206 | val_loss: 23.5209
epoch: 14/951 | step: 1860/6480 | trn_loss: 22.2104 | val_loss: 23.4567
epoch: 14/951 | step: 1875/6480 | trn_loss: 22.3400 | val_loss: 22.8985
epoch: 14/951 | step: 1890/6480 | trn_loss: 21.7107 | val_loss: 24.1540
epoch: 14/951 | step: 1905/6480 | trn_loss: 23.7981 | val_loss: 24.9358
epoch: 14/951 | step: 1920/6480 | trn_loss: 24.3995 | val_loss: 24.1735
epoch: 14/951 | step: 1935/6480 | trn_loss: 23.8210 | val_loss: 

epoch: 14/951 | step: 3435/6480 | trn_loss: 22.1841 | val_loss: 25.7270
epoch: 14/951 | step: 3450/6480 | trn_loss: 22.7285 | val_loss: 26.5505
epoch: 14/951 | step: 3465/6480 | trn_loss: 22.5499 | val_loss: 22.8065
epoch: 14/951 | step: 3480/6480 | trn_loss: 22.6178 | val_loss: 24.3084
epoch: 14/951 | step: 3495/6480 | trn_loss: 23.2744 | val_loss: 22.8353
epoch: 14/951 | step: 3510/6480 | trn_loss: 22.4546 | val_loss: 22.9261
epoch: 14/951 | step: 3525/6480 | trn_loss: 22.9117 | val_loss: 23.3669
epoch: 14/951 | step: 3540/6480 | trn_loss: 22.4609 | val_loss: 23.3765
epoch: 14/951 | step: 3555/6480 | trn_loss: 22.4942 | val_loss: 23.5077
epoch: 14/951 | step: 3570/6480 | trn_loss: 22.5094 | val_loss: 25.2682
epoch: 14/951 | step: 3585/6480 | trn_loss: 22.7626 | val_loss: 22.7697
epoch: 14/951 | step: 3600/6480 | trn_loss: 22.2885 | val_loss: 23.2506
epoch: 14/951 | step: 3615/6480 | trn_loss: 21.9994 | val_loss: 23.4279
epoch: 14/951 | step: 3630/6480 | trn_loss: 22.6387 | val_loss: 

epoch: 14/951 | step: 5130/6480 | trn_loss: 22.5862 | val_loss: 22.4129
epoch: 14/951 | step: 5145/6480 | trn_loss: 22.8620 | val_loss: 24.7445
epoch: 14/951 | step: 5160/6480 | trn_loss: 23.1591 | val_loss: 23.6287
epoch: 14/951 | step: 5175/6480 | trn_loss: 22.3139 | val_loss: 22.5595
epoch: 14/951 | step: 5190/6480 | trn_loss: 22.3111 | val_loss: 23.2483
epoch: 14/951 | step: 5205/6480 | trn_loss: 22.7455 | val_loss: 23.6500
epoch: 14/951 | step: 5220/6480 | trn_loss: 22.3072 | val_loss: 23.0764
epoch: 14/951 | step: 5235/6480 | trn_loss: 22.5636 | val_loss: 23.2120
epoch: 14/951 | step: 5250/6480 | trn_loss: 22.8493 | val_loss: 23.6134
epoch: 14/951 | step: 5265/6480 | trn_loss: 22.3219 | val_loss: 22.8326
epoch: 14/951 | step: 5280/6480 | trn_loss: 22.1351 | val_loss: 22.7846
epoch: 14/951 | step: 5295/6480 | trn_loss: 23.1804 | val_loss: 23.1195
epoch: 14/951 | step: 5310/6480 | trn_loss: 22.9736 | val_loss: 23.0054
epoch: 14/951 | step: 5325/6480 | trn_loss: 21.4734 | val_loss: 

epoch: 15/951 | step: 360/6480 | trn_loss: 22.8479 | val_loss: 27.2783
epoch: 15/951 | step: 375/6480 | trn_loss: 22.8582 | val_loss: 23.4184
epoch: 15/951 | step: 390/6480 | trn_loss: 22.7786 | val_loss: 22.6763
epoch: 15/951 | step: 405/6480 | trn_loss: 22.6057 | val_loss: 24.6861
epoch: 15/951 | step: 420/6480 | trn_loss: 23.6925 | val_loss: 23.7685
epoch: 15/951 | step: 435/6480 | trn_loss: 22.1224 | val_loss: 22.1710
epoch: 15/951 | step: 450/6480 | trn_loss: 21.8607 | val_loss: 23.2984
epoch: 15/951 | step: 465/6480 | trn_loss: 22.9453 | val_loss: 22.9551
epoch: 15/951 | step: 480/6480 | trn_loss: 22.6260 | val_loss: 23.6185
epoch: 15/951 | step: 495/6480 | trn_loss: 22.6891 | val_loss: 23.7889
epoch: 15/951 | step: 510/6480 | trn_loss: 23.0752 | val_loss: 23.9448
epoch: 15/951 | step: 525/6480 | trn_loss: 23.3952 | val_loss: 23.1464
epoch: 15/951 | step: 540/6480 | trn_loss: 22.0509 | val_loss: 22.9044
epoch: 15/951 | step: 555/6480 | trn_loss: 22.5627 | val_loss: 22.3766
epoch:

epoch: 15/951 | step: 2070/6480 | trn_loss: 22.0212 | val_loss: 22.9036
epoch: 15/951 | step: 2085/6480 | trn_loss: 23.1915 | val_loss: 23.7317
epoch: 15/951 | step: 2100/6480 | trn_loss: 22.1083 | val_loss: 23.8429
epoch: 15/951 | step: 2115/6480 | trn_loss: 23.2054 | val_loss: 25.0609
epoch: 15/951 | step: 2130/6480 | trn_loss: 22.2969 | val_loss: 22.9791
epoch: 15/951 | step: 2145/6480 | trn_loss: 22.1056 | val_loss: 23.1483
epoch: 15/951 | step: 2160/6480 | trn_loss: 21.7202 | val_loss: 23.4754
epoch: 15/951 | step: 2175/6480 | trn_loss: 24.1926 | val_loss: 23.5147
epoch: 15/951 | step: 2190/6480 | trn_loss: 23.3564 | val_loss: 23.1533
epoch: 15/951 | step: 2205/6480 | trn_loss: 22.6847 | val_loss: 23.7453
epoch: 15/951 | step: 2220/6480 | trn_loss: 22.3001 | val_loss: 23.6264
epoch: 15/951 | step: 2235/6480 | trn_loss: 21.7306 | val_loss: 23.8188
epoch: 15/951 | step: 2250/6480 | trn_loss: 22.1191 | val_loss: 24.1245
epoch: 15/951 | step: 2265/6480 | trn_loss: 22.0290 | val_loss: 

epoch: 15/951 | step: 3765/6480 | trn_loss: 22.4996 | val_loss: 22.3542
epoch: 15/951 | step: 3780/6480 | trn_loss: 23.2811 | val_loss: 23.0872
epoch: 15/951 | step: 3795/6480 | trn_loss: 22.6935 | val_loss: 22.9625
epoch: 15/951 | step: 3810/6480 | trn_loss: 23.3958 | val_loss: 24.2225
epoch: 15/951 | step: 3825/6480 | trn_loss: 22.3515 | val_loss: 22.5760
epoch: 15/951 | step: 3840/6480 | trn_loss: 21.7664 | val_loss: 22.5771
epoch: 15/951 | step: 3855/6480 | trn_loss: 21.8865 | val_loss: 22.5477
epoch: 15/951 | step: 3870/6480 | trn_loss: 22.0531 | val_loss: 22.6408
epoch: 15/951 | step: 3885/6480 | trn_loss: 21.9820 | val_loss: 23.3989
epoch: 15/951 | step: 3900/6480 | trn_loss: 22.7470 | val_loss: 22.8012
epoch: 15/951 | step: 3915/6480 | trn_loss: 21.9213 | val_loss: 23.5161
epoch: 15/951 | step: 3930/6480 | trn_loss: 22.4902 | val_loss: 22.4434
epoch: 15/951 | step: 3945/6480 | trn_loss: 22.3439 | val_loss: 23.3715
epoch: 15/951 | step: 3960/6480 | trn_loss: 22.1870 | val_loss: 

epoch: 15/951 | step: 5460/6480 | trn_loss: 22.5438 | val_loss: 23.5207
epoch: 15/951 | step: 5475/6480 | trn_loss: 22.4992 | val_loss: 22.2009
epoch: 15/951 | step: 5490/6480 | trn_loss: 23.3716 | val_loss: 23.0112
epoch: 15/951 | step: 5505/6480 | trn_loss: 22.9958 | val_loss: 24.9588
epoch: 15/951 | step: 5520/6480 | trn_loss: 22.9549 | val_loss: 25.9591
epoch: 15/951 | step: 5535/6480 | trn_loss: 23.6046 | val_loss: 22.4863
epoch: 15/951 | step: 5550/6480 | trn_loss: 23.1923 | val_loss: 23.3809
epoch: 15/951 | step: 5565/6480 | trn_loss: 21.8202 | val_loss: 23.2252
epoch: 15/951 | step: 5580/6480 | trn_loss: 21.6857 | val_loss: 24.3199
epoch: 15/951 | step: 5595/6480 | trn_loss: 22.9447 | val_loss: 24.4148
epoch: 15/951 | step: 5610/6480 | trn_loss: 22.5088 | val_loss: 22.4767
epoch: 15/951 | step: 5625/6480 | trn_loss: 23.5023 | val_loss: 22.2954
epoch: 15/951 | step: 5640/6480 | trn_loss: 21.9907 | val_loss: 22.9147
epoch: 15/951 | step: 5655/6480 | trn_loss: 21.9542 | val_loss: 

epoch: 16/951 | step: 690/6480 | trn_loss: 22.0372 | val_loss: 23.0211
epoch: 16/951 | step: 705/6480 | trn_loss: 21.8496 | val_loss: 22.1785
epoch: 16/951 | step: 720/6480 | trn_loss: 21.4657 | val_loss: 23.6121
epoch: 16/951 | step: 735/6480 | trn_loss: 22.4418 | val_loss: 24.0278
epoch: 16/951 | step: 750/6480 | trn_loss: 22.2611 | val_loss: 22.1142
epoch: 16/951 | step: 765/6480 | trn_loss: 21.3611 | val_loss: 22.1649
epoch: 16/951 | step: 780/6480 | trn_loss: 22.8973 | val_loss: 23.3804
epoch: 16/951 | step: 795/6480 | trn_loss: 22.3974 | val_loss: 23.6021
epoch: 16/951 | step: 810/6480 | trn_loss: 21.9818 | val_loss: 22.5532
epoch: 16/951 | step: 825/6480 | trn_loss: 22.2296 | val_loss: 22.6023
epoch: 16/951 | step: 840/6480 | trn_loss: 22.2285 | val_loss: 22.9165
epoch: 16/951 | step: 855/6480 | trn_loss: 23.3412 | val_loss: 22.7263
epoch: 16/951 | step: 870/6480 | trn_loss: 22.4843 | val_loss: 23.3811
epoch: 16/951 | step: 885/6480 | trn_loss: 21.9114 | val_loss: 21.8665
epoch:

epoch: 16/951 | step: 2400/6480 | trn_loss: 21.7728 | val_loss: 22.5015
epoch: 16/951 | step: 2415/6480 | trn_loss: 22.1937 | val_loss: 23.2351
epoch: 16/951 | step: 2430/6480 | trn_loss: 22.3691 | val_loss: 24.2481
epoch: 16/951 | step: 2445/6480 | trn_loss: 23.3641 | val_loss: 25.2025
epoch: 16/951 | step: 2460/6480 | trn_loss: 22.1708 | val_loss: 23.6135
epoch: 16/951 | step: 2475/6480 | trn_loss: 22.2645 | val_loss: 22.2006
epoch: 16/951 | step: 2490/6480 | trn_loss: 22.0465 | val_loss: 23.2499
epoch: 16/951 | step: 2505/6480 | trn_loss: 21.9626 | val_loss: 24.3523
epoch: 16/951 | step: 2520/6480 | trn_loss: 21.7678 | val_loss: 22.5455
epoch: 16/951 | step: 2535/6480 | trn_loss: 23.6869 | val_loss: 22.4623
epoch: 16/951 | step: 2550/6480 | trn_loss: 23.5854 | val_loss: 24.1045
epoch: 16/951 | step: 2565/6480 | trn_loss: 23.4179 | val_loss: 21.9539
epoch: 16/951 | step: 2580/6480 | trn_loss: 21.6545 | val_loss: 23.1716
epoch: 16/951 | step: 2595/6480 | trn_loss: 23.0341 | val_loss: 

epoch: 16/951 | step: 4095/6480 | trn_loss: 24.8985 | val_loss: 23.6232
epoch: 16/951 | step: 4110/6480 | trn_loss: 22.7669 | val_loss: 23.0853
epoch: 16/951 | step: 4125/6480 | trn_loss: 22.9683 | val_loss: 23.9700
epoch: 16/951 | step: 4140/6480 | trn_loss: 22.2762 | val_loss: 23.6703
epoch: 16/951 | step: 4155/6480 | trn_loss: 22.6777 | val_loss: 22.7387
epoch: 16/951 | step: 4170/6480 | trn_loss: 22.3904 | val_loss: 22.8135
epoch: 16/951 | step: 4185/6480 | trn_loss: 22.3096 | val_loss: 22.1750
epoch: 16/951 | step: 4200/6480 | trn_loss: 21.6423 | val_loss: 23.4721
epoch: 16/951 | step: 4215/6480 | trn_loss: 22.1456 | val_loss: 23.4134
epoch: 16/951 | step: 4230/6480 | trn_loss: 21.5412 | val_loss: 23.1127
epoch: 16/951 | step: 4245/6480 | trn_loss: 23.1329 | val_loss: 22.5281
epoch: 16/951 | step: 4260/6480 | trn_loss: 23.1001 | val_loss: 22.0126
epoch: 16/951 | step: 4275/6480 | trn_loss: 22.3515 | val_loss: 22.1975
epoch: 16/951 | step: 4290/6480 | trn_loss: 22.1982 | val_loss: 

epoch: 16/951 | step: 5790/6480 | trn_loss: 23.3247 | val_loss: 22.6024
epoch: 16/951 | step: 5805/6480 | trn_loss: 21.9496 | val_loss: 26.7049
epoch: 16/951 | step: 5820/6480 | trn_loss: 22.9105 | val_loss: 23.4919
epoch: 16/951 | step: 5835/6480 | trn_loss: 22.3503 | val_loss: 24.2735
epoch: 16/951 | step: 5850/6480 | trn_loss: 22.8925 | val_loss: 23.7652
epoch: 16/951 | step: 5865/6480 | trn_loss: 22.5232 | val_loss: 23.1372
epoch: 16/951 | step: 5880/6480 | trn_loss: 22.2214 | val_loss: 22.3542
epoch: 16/951 | step: 5895/6480 | trn_loss: 21.6819 | val_loss: 21.9841
epoch: 16/951 | step: 5910/6480 | trn_loss: 21.4113 | val_loss: 22.5726
epoch: 16/951 | step: 5925/6480 | trn_loss: 21.9879 | val_loss: 22.8262
epoch: 16/951 | step: 5940/6480 | trn_loss: 23.1155 | val_loss: 23.5077
epoch: 16/951 | step: 5955/6480 | trn_loss: 21.9488 | val_loss: 22.8100
epoch: 16/951 | step: 5970/6480 | trn_loss: 22.1839 | val_loss: 22.7850
epoch: 16/951 | step: 5985/6480 | trn_loss: 22.8940 | val_loss: 

epoch: 17/951 | step: 1020/6480 | trn_loss: 21.3570 | val_loss: 22.3018
epoch: 17/951 | step: 1035/6480 | trn_loss: 21.7733 | val_loss: 21.8580
epoch: 17/951 | step: 1050/6480 | trn_loss: 21.6974 | val_loss: 22.1393
epoch: 17/951 | step: 1065/6480 | trn_loss: 21.8790 | val_loss: 22.7672
epoch: 17/951 | step: 1080/6480 | trn_loss: 22.2683 | val_loss: 23.8630
epoch: 17/951 | step: 1095/6480 | trn_loss: 21.7784 | val_loss: 22.8408
epoch: 17/951 | step: 1110/6480 | trn_loss: 21.8889 | val_loss: 22.8808
epoch: 17/951 | step: 1125/6480 | trn_loss: 21.5822 | val_loss: 22.4878
epoch: 17/951 | step: 1140/6480 | trn_loss: 21.3530 | val_loss: 22.6438
epoch: 17/951 | step: 1155/6480 | trn_loss: 22.0309 | val_loss: 22.6199
epoch: 17/951 | step: 1170/6480 | trn_loss: 21.9729 | val_loss: 23.4641
epoch: 17/951 | step: 1185/6480 | trn_loss: 21.8762 | val_loss: 23.4710
epoch: 17/951 | step: 1200/6480 | trn_loss: 21.4953 | val_loss: 23.2726
epoch: 17/951 | step: 1215/6480 | trn_loss: 21.9897 | val_loss: 

epoch: 17/951 | step: 2715/6480 | trn_loss: 22.8102 | val_loss: 23.3369
epoch: 17/951 | step: 2730/6480 | trn_loss: 22.3121 | val_loss: 22.6771
epoch: 17/951 | step: 2745/6480 | trn_loss: 21.4970 | val_loss: 22.6650
epoch: 17/951 | step: 2760/6480 | trn_loss: 22.2358 | val_loss: 23.0529
epoch: 17/951 | step: 2775/6480 | trn_loss: 21.9099 | val_loss: 22.7355
epoch: 17/951 | step: 2790/6480 | trn_loss: 21.9324 | val_loss: 22.9916
epoch: 17/951 | step: 2805/6480 | trn_loss: 22.0278 | val_loss: 22.6589
epoch: 17/951 | step: 2820/6480 | trn_loss: 21.4026 | val_loss: 23.0016
epoch: 17/951 | step: 2835/6480 | trn_loss: 21.7970 | val_loss: 22.5789
epoch: 17/951 | step: 2850/6480 | trn_loss: 21.8559 | val_loss: 23.4458
epoch: 17/951 | step: 2865/6480 | trn_loss: 21.8769 | val_loss: 23.4234
epoch: 17/951 | step: 2880/6480 | trn_loss: 21.8599 | val_loss: 22.7925
epoch: 17/951 | step: 2895/6480 | trn_loss: 22.6637 | val_loss: 23.7699
epoch: 17/951 | step: 2910/6480 | trn_loss: 22.7389 | val_loss: 

epoch: 17/951 | step: 4410/6480 | trn_loss: 21.3620 | val_loss: 22.4250
epoch: 17/951 | step: 4425/6480 | trn_loss: 21.8973 | val_loss: 22.5900
epoch: 17/951 | step: 4440/6480 | trn_loss: 22.4314 | val_loss: 22.0659
epoch: 17/951 | step: 4455/6480 | trn_loss: 21.3227 | val_loss: 23.0541
epoch: 17/951 | step: 4470/6480 | trn_loss: 22.1549 | val_loss: 24.0291
epoch: 17/951 | step: 4485/6480 | trn_loss: 22.3268 | val_loss: 22.2247
epoch: 17/951 | step: 4500/6480 | trn_loss: 23.1586 | val_loss: 23.4320
epoch: 17/951 | step: 4515/6480 | trn_loss: 22.0931 | val_loss: 23.0672
epoch: 17/951 | step: 4530/6480 | trn_loss: 23.4037 | val_loss: 22.7280
epoch: 17/951 | step: 4545/6480 | trn_loss: 21.9997 | val_loss: 23.1627
epoch: 17/951 | step: 4560/6480 | trn_loss: 21.8399 | val_loss: 22.8442
epoch: 17/951 | step: 4575/6480 | trn_loss: 21.5411 | val_loss: 24.1269
epoch: 17/951 | step: 4590/6480 | trn_loss: 21.5423 | val_loss: 22.8893
epoch: 17/951 | step: 4605/6480 | trn_loss: 21.7932 | val_loss: 

epoch: 17/951 | step: 6105/6480 | trn_loss: 22.0118 | val_loss: 22.9668
epoch: 17/951 | step: 6120/6480 | trn_loss: 23.3462 | val_loss: 24.2500
epoch: 17/951 | step: 6135/6480 | trn_loss: 22.9998 | val_loss: 23.0226
epoch: 17/951 | step: 6150/6480 | trn_loss: 23.0871 | val_loss: 22.6200
epoch: 17/951 | step: 6165/6480 | trn_loss: 22.3826 | val_loss: 22.9450
epoch: 17/951 | step: 6180/6480 | trn_loss: 22.5571 | val_loss: 23.1923
epoch: 17/951 | step: 6195/6480 | trn_loss: 21.6607 | val_loss: 22.6757
epoch: 17/951 | step: 6210/6480 | trn_loss: 21.7594 | val_loss: 22.7895
epoch: 17/951 | step: 6225/6480 | trn_loss: 21.6826 | val_loss: 23.1232
epoch: 17/951 | step: 6240/6480 | trn_loss: 22.8684 | val_loss: 21.7612
epoch: 17/951 | step: 6255/6480 | trn_loss: 22.8634 | val_loss: 23.6984
epoch: 17/951 | step: 6270/6480 | trn_loss: 23.2270 | val_loss: 23.9367
epoch: 17/951 | step: 6285/6480 | trn_loss: 22.0007 | val_loss: 24.2192
epoch: 17/951 | step: 6300/6480 | trn_loss: 22.2219 | val_loss: 

epoch: 18/951 | step: 1335/6480 | trn_loss: 22.1399 | val_loss: 26.4416
epoch: 18/951 | step: 1350/6480 | trn_loss: 21.9694 | val_loss: 23.4671
epoch: 18/951 | step: 1365/6480 | trn_loss: 21.7238 | val_loss: 22.6885
epoch: 18/951 | step: 1380/6480 | trn_loss: 21.8573 | val_loss: 23.3182
epoch: 18/951 | step: 1395/6480 | trn_loss: 21.7417 | val_loss: 21.9599
epoch: 18/951 | step: 1410/6480 | trn_loss: 21.5960 | val_loss: 22.3130
epoch: 18/951 | step: 1425/6480 | trn_loss: 21.9339 | val_loss: 22.6601
epoch: 18/951 | step: 1440/6480 | trn_loss: 22.2051 | val_loss: 23.3906
epoch: 18/951 | step: 1455/6480 | trn_loss: 22.3588 | val_loss: 23.5811
epoch: 18/951 | step: 1470/6480 | trn_loss: 23.2755 | val_loss: 23.8657
epoch: 18/951 | step: 1485/6480 | trn_loss: 22.7281 | val_loss: 23.1553
epoch: 18/951 | step: 1500/6480 | trn_loss: 22.7299 | val_loss: 23.4057
epoch: 18/951 | step: 1515/6480 | trn_loss: 22.1153 | val_loss: 23.5402
epoch: 18/951 | step: 1530/6480 | trn_loss: 21.0531 | val_loss: 

epoch: 18/951 | step: 3030/6480 | trn_loss: 22.4001 | val_loss: 24.5081
epoch: 18/951 | step: 3045/6480 | trn_loss: 21.3609 | val_loss: 22.1057
epoch: 18/951 | step: 3060/6480 | trn_loss: 21.7156 | val_loss: 22.6573
epoch: 18/951 | step: 3075/6480 | trn_loss: 22.5384 | val_loss: 24.0326
epoch: 18/951 | step: 3090/6480 | trn_loss: 21.6602 | val_loss: 22.0532
epoch: 18/951 | step: 3105/6480 | trn_loss: 22.7871 | val_loss: 22.6627
epoch: 18/951 | step: 3120/6480 | trn_loss: 22.3731 | val_loss: 22.6989
epoch: 18/951 | step: 3135/6480 | trn_loss: 21.5551 | val_loss: 23.0353
epoch: 18/951 | step: 3150/6480 | trn_loss: 21.7990 | val_loss: 24.7654
epoch: 18/951 | step: 3165/6480 | trn_loss: 21.4654 | val_loss: 22.9053
epoch: 18/951 | step: 3180/6480 | trn_loss: 21.3164 | val_loss: 22.7348
epoch: 18/951 | step: 3195/6480 | trn_loss: 21.2707 | val_loss: 22.9532
epoch: 18/951 | step: 3210/6480 | trn_loss: 21.8617 | val_loss: 22.6529
epoch: 18/951 | step: 3225/6480 | trn_loss: 22.8266 | val_loss: 

epoch: 18/951 | step: 4725/6480 | trn_loss: 22.3548 | val_loss: 23.6825
epoch: 18/951 | step: 4740/6480 | trn_loss: 21.7636 | val_loss: 23.2296
epoch: 18/951 | step: 4755/6480 | trn_loss: 21.9612 | val_loss: 22.1199
epoch: 18/951 | step: 4770/6480 | trn_loss: 21.8689 | val_loss: 22.9770
epoch: 18/951 | step: 4785/6480 | trn_loss: 22.6633 | val_loss: 24.4881
epoch: 18/951 | step: 4800/6480 | trn_loss: 22.9265 | val_loss: 22.3147
epoch: 18/951 | step: 4815/6480 | trn_loss: 21.8671 | val_loss: 22.5696
epoch: 18/951 | step: 4830/6480 | trn_loss: 21.8346 | val_loss: 22.3265
epoch: 18/951 | step: 4845/6480 | trn_loss: 21.7571 | val_loss: 24.0713
epoch: 18/951 | step: 4860/6480 | trn_loss: 22.0540 | val_loss: 22.7963
epoch: 18/951 | step: 4875/6480 | trn_loss: 21.2539 | val_loss: 23.1156
epoch: 18/951 | step: 4890/6480 | trn_loss: 21.7673 | val_loss: 22.2493
epoch: 18/951 | step: 4905/6480 | trn_loss: 21.9297 | val_loss: 24.4674
epoch: 18/951 | step: 4920/6480 | trn_loss: 21.6516 | val_loss: 

epoch: 18/951 | step: 6420/6480 | trn_loss: 23.0096 | val_loss: 22.3444
epoch: 18/951 | step: 6435/6480 | trn_loss: 22.0580 | val_loss: 22.2018
epoch: 18/951 | step: 6450/6480 | trn_loss: 21.9106 | val_loss: 22.6691
epoch: 18/951 | step: 6465/6480 | trn_loss: 21.4672 | val_loss: 22.0985
epoch: 18/951 | step: 6480/6480 | trn_loss: 22.8834 | val_loss: 21.9535
epoch: 19/951 | step: 15/6480 | trn_loss: 21.6535 | val_loss: 21.8961
epoch: 19/951 | step: 30/6480 | trn_loss: 21.7119 | val_loss: 22.8121
epoch: 19/951 | step: 45/6480 | trn_loss: 21.6698 | val_loss: 22.8564
epoch: 19/951 | step: 60/6480 | trn_loss: 22.4065 | val_loss: 22.2826
epoch: 19/951 | step: 75/6480 | trn_loss: 22.2009 | val_loss: 22.6662
epoch: 19/951 | step: 90/6480 | trn_loss: 21.2097 | val_loss: 22.7652
epoch: 19/951 | step: 105/6480 | trn_loss: 21.3976 | val_loss: 22.8150
epoch: 19/951 | step: 120/6480 | trn_loss: 21.4678 | val_loss: 22.3196
epoch: 19/951 | step: 135/6480 | trn_loss: 21.4770 | val_loss: 21.4917
epoch: 

epoch: 19/951 | step: 1650/6480 | trn_loss: 22.0284 | val_loss: 22.5452
epoch: 19/951 | step: 1665/6480 | trn_loss: 21.6359 | val_loss: 22.2394
epoch: 19/951 | step: 1680/6480 | trn_loss: 22.0779 | val_loss: 22.2292
epoch: 19/951 | step: 1695/6480 | trn_loss: 22.3336 | val_loss: 21.9570
epoch: 19/951 | step: 1710/6480 | trn_loss: 21.9625 | val_loss: 22.6630
epoch: 19/951 | step: 1725/6480 | trn_loss: 21.6102 | val_loss: 23.4284
epoch: 19/951 | step: 1740/6480 | trn_loss: 22.4511 | val_loss: 23.0764
epoch: 19/951 | step: 1755/6480 | trn_loss: 21.5514 | val_loss: 21.9330
epoch: 19/951 | step: 1770/6480 | trn_loss: 21.4649 | val_loss: 22.8075
epoch: 19/951 | step: 1785/6480 | trn_loss: 21.8834 | val_loss: 22.2897
epoch: 19/951 | step: 1800/6480 | trn_loss: 21.9766 | val_loss: 22.4403
epoch: 19/951 | step: 1815/6480 | trn_loss: 22.0093 | val_loss: 23.2121
epoch: 19/951 | step: 1830/6480 | trn_loss: 22.5249 | val_loss: 22.3959
epoch: 19/951 | step: 1845/6480 | trn_loss: 22.1702 | val_loss: 

epoch: 19/951 | step: 3345/6480 | trn_loss: 22.5838 | val_loss: 22.9368
epoch: 19/951 | step: 3360/6480 | trn_loss: 21.5150 | val_loss: 22.1713
epoch: 19/951 | step: 3375/6480 | trn_loss: 21.8250 | val_loss: 22.0315
epoch: 19/951 | step: 3390/6480 | trn_loss: 21.9070 | val_loss: 22.4663
epoch: 19/951 | step: 3405/6480 | trn_loss: 22.4373 | val_loss: 22.0638
epoch: 19/951 | step: 3420/6480 | trn_loss: 21.6369 | val_loss: 23.8408
epoch: 19/951 | step: 3435/6480 | trn_loss: 22.4035 | val_loss: 23.5659
epoch: 19/951 | step: 3450/6480 | trn_loss: 22.2773 | val_loss: 25.9811
epoch: 19/951 | step: 3465/6480 | trn_loss: 21.7229 | val_loss: 22.1620
epoch: 19/951 | step: 3480/6480 | trn_loss: 21.6424 | val_loss: 23.1968
epoch: 19/951 | step: 3495/6480 | trn_loss: 22.9789 | val_loss: 22.2223
epoch: 19/951 | step: 3510/6480 | trn_loss: 21.7019 | val_loss: 23.1673
epoch: 19/951 | step: 3525/6480 | trn_loss: 22.3214 | val_loss: 22.1918
epoch: 19/951 | step: 3540/6480 | trn_loss: 21.5953 | val_loss: 

epoch: 19/951 | step: 5040/6480 | trn_loss: 21.6848 | val_loss: 25.9120
epoch: 19/951 | step: 5055/6480 | trn_loss: 22.0702 | val_loss: 23.9291
epoch: 19/951 | step: 5070/6480 | trn_loss: 22.4513 | val_loss: 22.1478
epoch: 19/951 | step: 5085/6480 | trn_loss: 21.6220 | val_loss: 22.6637
epoch: 19/951 | step: 5100/6480 | trn_loss: 21.7435 | val_loss: 22.9247
epoch: 19/951 | step: 5115/6480 | trn_loss: 22.1113 | val_loss: 21.8771
epoch: 19/951 | step: 5130/6480 | trn_loss: 21.6031 | val_loss: 21.7462
epoch: 19/951 | step: 5145/6480 | trn_loss: 22.3392 | val_loss: 22.4331
epoch: 19/951 | step: 5160/6480 | trn_loss: 21.4666 | val_loss: 23.3121
epoch: 19/951 | step: 5175/6480 | trn_loss: 21.0753 | val_loss: 22.2381
epoch: 19/951 | step: 5190/6480 | trn_loss: 21.3979 | val_loss: 22.5655
epoch: 19/951 | step: 5205/6480 | trn_loss: 21.8152 | val_loss: 23.1612
epoch: 19/951 | step: 5220/6480 | trn_loss: 21.5988 | val_loss: 23.2370
epoch: 19/951 | step: 5235/6480 | trn_loss: 21.8447 | val_loss: 

epoch: 20/951 | step: 270/6480 | trn_loss: 21.2042 | val_loss: 22.3098
epoch: 20/951 | step: 285/6480 | trn_loss: 22.3220 | val_loss: 22.3622
epoch: 20/951 | step: 300/6480 | trn_loss: 21.6525 | val_loss: 22.2659
epoch: 20/951 | step: 315/6480 | trn_loss: 21.2802 | val_loss: 22.8486
epoch: 20/951 | step: 330/6480 | trn_loss: 21.0549 | val_loss: 21.3278
epoch: 20/951 | step: 345/6480 | trn_loss: 21.2641 | val_loss: 21.9819
epoch: 20/951 | step: 360/6480 | trn_loss: 20.5419 | val_loss: 22.8109
epoch: 20/951 | step: 375/6480 | trn_loss: 21.1859 | val_loss: 23.1028
epoch: 20/951 | step: 390/6480 | trn_loss: 21.2226 | val_loss: 23.2678
epoch: 20/951 | step: 405/6480 | trn_loss: 21.7786 | val_loss: 24.0510
epoch: 20/951 | step: 420/6480 | trn_loss: 21.4443 | val_loss: 22.3856
epoch: 20/951 | step: 435/6480 | trn_loss: 21.0162 | val_loss: 22.4874
epoch: 20/951 | step: 450/6480 | trn_loss: 21.9771 | val_loss: 21.6955
epoch: 20/951 | step: 465/6480 | trn_loss: 21.3514 | val_loss: 22.2585
epoch:

epoch: 20/951 | step: 1980/6480 | trn_loss: 21.8254 | val_loss: 23.7244
epoch: 20/951 | step: 1995/6480 | trn_loss: 21.6528 | val_loss: 23.8447
epoch: 20/951 | step: 2010/6480 | trn_loss: 22.1446 | val_loss: 22.1751
epoch: 20/951 | step: 2025/6480 | trn_loss: 21.4101 | val_loss: 22.1146
epoch: 20/951 | step: 2040/6480 | trn_loss: 21.6125 | val_loss: 21.8438
epoch: 20/951 | step: 2055/6480 | trn_loss: 22.0996 | val_loss: 22.2815
epoch: 20/951 | step: 2070/6480 | trn_loss: 22.3765 | val_loss: 22.7624
epoch: 20/951 | step: 2085/6480 | trn_loss: 22.8781 | val_loss: 24.1991
epoch: 20/951 | step: 2100/6480 | trn_loss: 22.2483 | val_loss: 22.8880
epoch: 20/951 | step: 2115/6480 | trn_loss: 21.3085 | val_loss: 21.9314
epoch: 20/951 | step: 2130/6480 | trn_loss: 21.2285 | val_loss: 22.6502
epoch: 20/951 | step: 2145/6480 | trn_loss: 21.8535 | val_loss: 21.7871
epoch: 20/951 | step: 2160/6480 | trn_loss: 21.5307 | val_loss: 22.1361
epoch: 20/951 | step: 2175/6480 | trn_loss: 21.6830 | val_loss: 

epoch: 20/951 | step: 3675/6480 | trn_loss: 21.3915 | val_loss: 22.1382
epoch: 20/951 | step: 3690/6480 | trn_loss: 21.2980 | val_loss: 21.7874
epoch: 20/951 | step: 3705/6480 | trn_loss: 21.4517 | val_loss: 23.3810
epoch: 20/951 | step: 3720/6480 | trn_loss: 21.3910 | val_loss: 23.0064
epoch: 20/951 | step: 3735/6480 | trn_loss: 21.7757 | val_loss: 22.3766
epoch: 20/951 | step: 3750/6480 | trn_loss: 23.1111 | val_loss: 22.7432
epoch: 20/951 | step: 3765/6480 | trn_loss: 21.2809 | val_loss: 22.5588
epoch: 20/951 | step: 3780/6480 | trn_loss: 21.0002 | val_loss: 22.2198
epoch: 20/951 | step: 3795/6480 | trn_loss: 20.9947 | val_loss: 22.8081
epoch: 20/951 | step: 3810/6480 | trn_loss: 21.5239 | val_loss: 22.0237
epoch: 20/951 | step: 3825/6480 | trn_loss: 21.0902 | val_loss: 22.7147
epoch: 20/951 | step: 3840/6480 | trn_loss: 22.7377 | val_loss: 22.1900
epoch: 20/951 | step: 3855/6480 | trn_loss: 21.3180 | val_loss: 24.3442
epoch: 20/951 | step: 3870/6480 | trn_loss: 21.6463 | val_loss: 

epoch: 20/951 | step: 5370/6480 | trn_loss: 21.6698 | val_loss: 22.4547
epoch: 20/951 | step: 5385/6480 | trn_loss: 21.7940 | val_loss: 22.5691
epoch: 20/951 | step: 5400/6480 | trn_loss: 21.6320 | val_loss: 24.1611
epoch: 20/951 | step: 5415/6480 | trn_loss: 21.8492 | val_loss: 22.0918
epoch: 20/951 | step: 5430/6480 | trn_loss: 21.8439 | val_loss: 22.8230
epoch: 20/951 | step: 5445/6480 | trn_loss: 21.4413 | val_loss: 23.7774
epoch: 20/951 | step: 5460/6480 | trn_loss: 21.7841 | val_loss: 22.0105
epoch: 20/951 | step: 5475/6480 | trn_loss: 21.7604 | val_loss: 22.2802
epoch: 20/951 | step: 5490/6480 | trn_loss: 20.9278 | val_loss: 22.4687
epoch: 20/951 | step: 5505/6480 | trn_loss: 20.9797 | val_loss: 23.6262
epoch: 20/951 | step: 5520/6480 | trn_loss: 21.7815 | val_loss: 22.2473
epoch: 20/951 | step: 5535/6480 | trn_loss: 21.9761 | val_loss: 22.8868
epoch: 20/951 | step: 5550/6480 | trn_loss: 21.6650 | val_loss: 22.9641
epoch: 20/951 | step: 5565/6480 | trn_loss: 21.1214 | val_loss: 

epoch: 21/951 | step: 600/6480 | trn_loss: 21.1313 | val_loss: 22.0460
epoch: 21/951 | step: 615/6480 | trn_loss: 21.6347 | val_loss: 25.7538
epoch: 21/951 | step: 630/6480 | trn_loss: 23.2554 | val_loss: 23.0669
epoch: 21/951 | step: 645/6480 | trn_loss: 21.6167 | val_loss: 22.2813
epoch: 21/951 | step: 660/6480 | trn_loss: 21.8151 | val_loss: 23.6238
epoch: 21/951 | step: 675/6480 | trn_loss: 21.2777 | val_loss: 21.5712
epoch: 21/951 | step: 690/6480 | trn_loss: 20.4098 | val_loss: 21.8005
epoch: 21/951 | step: 705/6480 | trn_loss: 20.8348 | val_loss: 22.7790
epoch: 21/951 | step: 720/6480 | trn_loss: 21.1221 | val_loss: 23.2421
epoch: 21/951 | step: 735/6480 | trn_loss: 21.1855 | val_loss: 21.8996
epoch: 21/951 | step: 750/6480 | trn_loss: 21.5782 | val_loss: 21.8590
epoch: 21/951 | step: 765/6480 | trn_loss: 21.6720 | val_loss: 23.9554
epoch: 21/951 | step: 780/6480 | trn_loss: 21.8977 | val_loss: 21.5538
epoch: 21/951 | step: 795/6480 | trn_loss: 21.9383 | val_loss: 21.9572
epoch:

epoch: 21/951 | step: 2310/6480 | trn_loss: 21.7466 | val_loss: 22.7346
epoch: 21/951 | step: 2325/6480 | trn_loss: 21.3856 | val_loss: 22.8678
epoch: 21/951 | step: 2340/6480 | trn_loss: 21.2292 | val_loss: 22.5756
epoch: 21/951 | step: 2355/6480 | trn_loss: 21.3223 | val_loss: 21.9507
epoch: 21/951 | step: 2370/6480 | trn_loss: 20.5901 | val_loss: 21.4072
epoch: 21/951 | step: 2385/6480 | trn_loss: 20.7030 | val_loss: 23.3117
epoch: 21/951 | step: 2400/6480 | trn_loss: 21.7192 | val_loss: 22.5094
epoch: 21/951 | step: 2415/6480 | trn_loss: 20.9162 | val_loss: 22.6460
epoch: 21/951 | step: 2430/6480 | trn_loss: 21.1892 | val_loss: 23.3462
epoch: 21/951 | step: 2445/6480 | trn_loss: 22.5086 | val_loss: 22.6493
epoch: 21/951 | step: 2460/6480 | trn_loss: 22.2287 | val_loss: 22.0798
epoch: 21/951 | step: 2475/6480 | trn_loss: 21.7193 | val_loss: 22.6469
epoch: 21/951 | step: 2490/6480 | trn_loss: 22.8517 | val_loss: 21.9359
epoch: 21/951 | step: 2505/6480 | trn_loss: 21.5127 | val_loss: 

epoch: 21/951 | step: 4005/6480 | trn_loss: 21.8426 | val_loss: 22.7441
epoch: 21/951 | step: 4020/6480 | trn_loss: 21.4874 | val_loss: 22.7992
epoch: 21/951 | step: 4035/6480 | trn_loss: 21.4860 | val_loss: 22.2794
epoch: 21/951 | step: 4050/6480 | trn_loss: 21.7683 | val_loss: 22.5758
epoch: 21/951 | step: 4065/6480 | trn_loss: 22.2481 | val_loss: 23.7742
epoch: 21/951 | step: 4080/6480 | trn_loss: 20.9572 | val_loss: 21.8330
epoch: 21/951 | step: 4095/6480 | trn_loss: 20.8712 | val_loss: 22.7637
epoch: 21/951 | step: 4110/6480 | trn_loss: 21.6435 | val_loss: 22.5190
epoch: 21/951 | step: 4125/6480 | trn_loss: 22.0552 | val_loss: 21.6564
epoch: 21/951 | step: 4140/6480 | trn_loss: 21.9764 | val_loss: 22.3996
epoch: 21/951 | step: 4155/6480 | trn_loss: 21.3105 | val_loss: 23.0705
epoch: 21/951 | step: 4170/6480 | trn_loss: 21.2464 | val_loss: 22.0623
epoch: 21/951 | step: 4185/6480 | trn_loss: 22.5476 | val_loss: 21.6783
epoch: 21/951 | step: 4200/6480 | trn_loss: 21.7972 | val_loss: 

epoch: 21/951 | step: 5700/6480 | trn_loss: 21.2050 | val_loss: 21.6872
epoch: 21/951 | step: 5715/6480 | trn_loss: 21.1277 | val_loss: 22.2883
epoch: 21/951 | step: 5730/6480 | trn_loss: 21.8463 | val_loss: 22.4339
epoch: 21/951 | step: 5745/6480 | trn_loss: 20.9619 | val_loss: 21.1874
epoch: 21/951 | step: 5760/6480 | trn_loss: 20.8246 | val_loss: 23.1117
epoch: 21/951 | step: 5775/6480 | trn_loss: 21.8100 | val_loss: 22.8669
epoch: 21/951 | step: 5790/6480 | trn_loss: 20.4760 | val_loss: 21.7335
epoch: 21/951 | step: 5805/6480 | trn_loss: 21.7891 | val_loss: 22.5374
epoch: 21/951 | step: 5820/6480 | trn_loss: 20.7875 | val_loss: 21.3335
epoch: 21/951 | step: 5835/6480 | trn_loss: 20.9945 | val_loss: 23.5553
epoch: 21/951 | step: 5850/6480 | trn_loss: 20.9182 | val_loss: 21.9536
epoch: 21/951 | step: 5865/6480 | trn_loss: 20.9056 | val_loss: 22.4082
epoch: 21/951 | step: 5880/6480 | trn_loss: 21.5175 | val_loss: 22.8705
epoch: 21/951 | step: 5895/6480 | trn_loss: 20.6886 | val_loss: 

epoch: 22/951 | step: 930/6480 | trn_loss: 21.6175 | val_loss: 22.0702
epoch: 22/951 | step: 945/6480 | trn_loss: 21.0986 | val_loss: 23.4050
epoch: 22/951 | step: 960/6480 | trn_loss: 21.2871 | val_loss: 21.3273
epoch: 22/951 | step: 975/6480 | trn_loss: 20.6301 | val_loss: 23.3201
epoch: 22/951 | step: 990/6480 | trn_loss: 21.1968 | val_loss: 22.3505
epoch: 22/951 | step: 1005/6480 | trn_loss: 20.3380 | val_loss: 21.8803
epoch: 22/951 | step: 1020/6480 | trn_loss: 20.2725 | val_loss: 22.5988
epoch: 22/951 | step: 1035/6480 | trn_loss: 21.8092 | val_loss: 22.0983
epoch: 22/951 | step: 1050/6480 | trn_loss: 20.3938 | val_loss: 22.7584
epoch: 22/951 | step: 1065/6480 | trn_loss: 21.7304 | val_loss: 21.9678
epoch: 22/951 | step: 1080/6480 | trn_loss: 20.9114 | val_loss: 21.8577
epoch: 22/951 | step: 1095/6480 | trn_loss: 21.6882 | val_loss: 22.8656
epoch: 22/951 | step: 1110/6480 | trn_loss: 21.8493 | val_loss: 22.0262
epoch: 22/951 | step: 1125/6480 | trn_loss: 20.6583 | val_loss: 22.04

epoch: 22/951 | step: 2625/6480 | trn_loss: 21.2952 | val_loss: 22.2041
epoch: 22/951 | step: 2640/6480 | trn_loss: 20.9919 | val_loss: 22.1130
epoch: 22/951 | step: 2655/6480 | trn_loss: 20.6058 | val_loss: 23.2882
epoch: 22/951 | step: 2670/6480 | trn_loss: 21.1409 | val_loss: 21.9698
epoch: 22/951 | step: 2685/6480 | trn_loss: 20.7504 | val_loss: 22.2518
epoch: 22/951 | step: 2700/6480 | trn_loss: 20.9848 | val_loss: 21.5510
epoch: 22/951 | step: 2715/6480 | trn_loss: 21.5591 | val_loss: 22.2718
epoch: 22/951 | step: 2730/6480 | trn_loss: 21.1963 | val_loss: 22.1654
epoch: 22/951 | step: 2745/6480 | trn_loss: 20.8017 | val_loss: 21.9798
epoch: 22/951 | step: 2760/6480 | trn_loss: 21.1769 | val_loss: 22.9132
epoch: 22/951 | step: 2775/6480 | trn_loss: 21.2553 | val_loss: 21.7456
epoch: 22/951 | step: 2790/6480 | trn_loss: 22.0991 | val_loss: 21.3576
epoch: 22/951 | step: 2805/6480 | trn_loss: 22.0852 | val_loss: 26.1256
epoch: 22/951 | step: 2820/6480 | trn_loss: 21.4994 | val_loss: 

epoch: 22/951 | step: 4320/6480 | trn_loss: 21.1327 | val_loss: 21.7907
epoch: 22/951 | step: 4335/6480 | trn_loss: 20.7645 | val_loss: 21.2483
epoch: 22/951 | step: 4350/6480 | trn_loss: 21.1520 | val_loss: 21.9826
epoch: 22/951 | step: 4365/6480 | trn_loss: 21.0827 | val_loss: 22.3689
epoch: 22/951 | step: 4380/6480 | trn_loss: 22.2757 | val_loss: 22.5706
epoch: 22/951 | step: 4395/6480 | trn_loss: 21.4195 | val_loss: 22.9520
epoch: 22/951 | step: 4410/6480 | trn_loss: 21.1921 | val_loss: 21.3086
epoch: 22/951 | step: 4425/6480 | trn_loss: 21.0199 | val_loss: 22.4489
epoch: 22/951 | step: 4440/6480 | trn_loss: 21.2473 | val_loss: 21.1942
epoch: 22/951 | step: 4455/6480 | trn_loss: 21.8938 | val_loss: 22.1384
epoch: 22/951 | step: 4470/6480 | trn_loss: 22.1417 | val_loss: 23.2638
epoch: 22/951 | step: 4485/6480 | trn_loss: 21.5345 | val_loss: 21.8477
epoch: 22/951 | step: 4500/6480 | trn_loss: 20.9503 | val_loss: 22.1318
epoch: 22/951 | step: 4515/6480 | trn_loss: 21.7762 | val_loss: 

epoch: 22/951 | step: 6015/6480 | trn_loss: 20.8898 | val_loss: 22.1882
epoch: 22/951 | step: 6030/6480 | trn_loss: 22.5267 | val_loss: 23.1228
epoch: 22/951 | step: 6045/6480 | trn_loss: 21.5152 | val_loss: 22.3306
epoch: 22/951 | step: 6060/6480 | trn_loss: 21.6377 | val_loss: 22.2661
epoch: 22/951 | step: 6075/6480 | trn_loss: 20.5275 | val_loss: 22.9771
epoch: 22/951 | step: 6090/6480 | trn_loss: 21.7283 | val_loss: 22.0342
epoch: 22/951 | step: 6105/6480 | trn_loss: 21.3680 | val_loss: 21.6317
epoch: 22/951 | step: 6120/6480 | trn_loss: 20.8339 | val_loss: 22.5854
epoch: 22/951 | step: 6135/6480 | trn_loss: 21.0955 | val_loss: 21.7617
epoch: 22/951 | step: 6150/6480 | trn_loss: 21.4105 | val_loss: 21.5038
epoch: 22/951 | step: 6165/6480 | trn_loss: 21.1452 | val_loss: 23.0943
epoch: 22/951 | step: 6180/6480 | trn_loss: 21.5102 | val_loss: 22.0797
epoch: 22/951 | step: 6195/6480 | trn_loss: 20.5911 | val_loss: 21.7249
epoch: 22/951 | step: 6210/6480 | trn_loss: 21.3793 | val_loss: 

epoch: 23/951 | step: 1245/6480 | trn_loss: 22.0886 | val_loss: 22.8575
epoch: 23/951 | step: 1260/6480 | trn_loss: 21.6067 | val_loss: 22.4652
epoch: 23/951 | step: 1275/6480 | trn_loss: 21.4504 | val_loss: 22.3135
epoch: 23/951 | step: 1290/6480 | trn_loss: 20.7245 | val_loss: 21.6162
epoch: 23/951 | step: 1305/6480 | trn_loss: 22.0313 | val_loss: 23.3352
epoch: 23/951 | step: 1320/6480 | trn_loss: 21.3088 | val_loss: 21.7704
epoch: 23/951 | step: 1335/6480 | trn_loss: 20.9664 | val_loss: 23.0332
epoch: 23/951 | step: 1350/6480 | trn_loss: 20.8403 | val_loss: 21.8567
epoch: 23/951 | step: 1365/6480 | trn_loss: 20.6244 | val_loss: 22.1578
epoch: 23/951 | step: 1380/6480 | trn_loss: 20.8454 | val_loss: 21.1171
epoch: 23/951 | step: 1395/6480 | trn_loss: 21.5732 | val_loss: 21.7776
epoch: 23/951 | step: 1410/6480 | trn_loss: 20.8923 | val_loss: 23.5507
epoch: 23/951 | step: 1425/6480 | trn_loss: 20.9334 | val_loss: 24.1130
epoch: 23/951 | step: 1440/6480 | trn_loss: 21.9234 | val_loss: 

epoch: 23/951 | step: 2940/6480 | trn_loss: 20.7032 | val_loss: 22.0169
epoch: 23/951 | step: 2955/6480 | trn_loss: 20.7948 | val_loss: 22.7293
epoch: 23/951 | step: 2970/6480 | trn_loss: 20.6104 | val_loss: 21.5553
epoch: 23/951 | step: 2985/6480 | trn_loss: 20.6636 | val_loss: 21.9527
epoch: 23/951 | step: 3000/6480 | trn_loss: 20.6215 | val_loss: 22.5317
epoch: 23/951 | step: 3015/6480 | trn_loss: 22.7674 | val_loss: 22.5774
epoch: 23/951 | step: 3030/6480 | trn_loss: 20.7946 | val_loss: 22.6319
epoch: 23/951 | step: 3045/6480 | trn_loss: 21.0643 | val_loss: 22.6172
epoch: 23/951 | step: 3060/6480 | trn_loss: 20.8839 | val_loss: 21.7493
epoch: 23/951 | step: 3075/6480 | trn_loss: 20.7725 | val_loss: 22.3358
epoch: 23/951 | step: 3090/6480 | trn_loss: 21.1848 | val_loss: 22.1855
epoch: 23/951 | step: 3105/6480 | trn_loss: 20.7300 | val_loss: 22.3104
epoch: 23/951 | step: 3120/6480 | trn_loss: 20.7969 | val_loss: 22.5785
epoch: 23/951 | step: 3135/6480 | trn_loss: 21.4467 | val_loss: 

epoch: 23/951 | step: 4635/6480 | trn_loss: 21.5137 | val_loss: 21.2068
epoch: 23/951 | step: 4650/6480 | trn_loss: 20.6757 | val_loss: 21.5572
epoch: 23/951 | step: 4665/6480 | trn_loss: 20.7443 | val_loss: 22.0048
epoch: 23/951 | step: 4680/6480 | trn_loss: 20.9364 | val_loss: 21.6117
epoch: 23/951 | step: 4695/6480 | trn_loss: 21.2005 | val_loss: 23.8431
epoch: 23/951 | step: 4710/6480 | trn_loss: 20.6716 | val_loss: 21.7841
epoch: 23/951 | step: 4725/6480 | trn_loss: 20.6567 | val_loss: 21.5580
epoch: 23/951 | step: 4740/6480 | trn_loss: 20.8286 | val_loss: 22.8001
epoch: 23/951 | step: 4755/6480 | trn_loss: 21.8732 | val_loss: 21.1630
epoch: 23/951 | step: 4770/6480 | trn_loss: 20.9376 | val_loss: 21.1816
epoch: 23/951 | step: 4785/6480 | trn_loss: 21.2463 | val_loss: 22.3439
epoch: 23/951 | step: 4800/6480 | trn_loss: 21.3439 | val_loss: 21.0941
epoch: 23/951 | step: 4815/6480 | trn_loss: 22.0263 | val_loss: 22.5822
epoch: 23/951 | step: 4830/6480 | trn_loss: 21.0637 | val_loss: 

epoch: 23/951 | step: 6330/6480 | trn_loss: 20.9088 | val_loss: 21.1085
epoch: 23/951 | step: 6345/6480 | trn_loss: 20.9509 | val_loss: 22.2220
epoch: 23/951 | step: 6360/6480 | trn_loss: 21.2993 | val_loss: 22.9712
epoch: 23/951 | step: 6375/6480 | trn_loss: 20.9788 | val_loss: 21.9037
epoch: 23/951 | step: 6390/6480 | trn_loss: 21.1241 | val_loss: 22.0716
epoch: 23/951 | step: 6405/6480 | trn_loss: 20.8675 | val_loss: 21.4465
epoch: 23/951 | step: 6420/6480 | trn_loss: 20.4832 | val_loss: 22.4118
epoch: 23/951 | step: 6435/6480 | trn_loss: 21.6580 | val_loss: 21.6617
epoch: 23/951 | step: 6450/6480 | trn_loss: 21.1812 | val_loss: 22.5000
epoch: 23/951 | step: 6465/6480 | trn_loss: 21.6171 | val_loss: 22.4937
epoch: 23/951 | step: 6480/6480 | trn_loss: 21.4771 | val_loss: 22.2132
epoch: 24/951 | step: 15/6480 | trn_loss: 23.3905 | val_loss: 22.9834
epoch: 24/951 | step: 30/6480 | trn_loss: 21.4558 | val_loss: 21.5899
epoch: 24/951 | step: 45/6480 | trn_loss: 21.0585 | val_loss: 22.065

epoch: 24/951 | step: 1560/6480 | trn_loss: 20.8918 | val_loss: 23.3439
epoch: 24/951 | step: 1575/6480 | trn_loss: 21.4493 | val_loss: 23.6986
epoch: 24/951 | step: 1590/6480 | trn_loss: 21.3395 | val_loss: 21.6934
epoch: 24/951 | step: 1605/6480 | trn_loss: 20.2852 | val_loss: 21.9946
epoch: 24/951 | step: 1620/6480 | trn_loss: 20.7783 | val_loss: 21.4216
epoch: 24/951 | step: 1635/6480 | trn_loss: 21.0113 | val_loss: 22.2155
epoch: 24/951 | step: 1650/6480 | trn_loss: 20.6255 | val_loss: 22.3655
epoch: 24/951 | step: 1665/6480 | trn_loss: 21.1603 | val_loss: 22.2912
epoch: 24/951 | step: 1680/6480 | trn_loss: 21.0173 | val_loss: 22.1232
epoch: 24/951 | step: 1695/6480 | trn_loss: 21.2948 | val_loss: 21.4698
epoch: 24/951 | step: 1710/6480 | trn_loss: 20.5326 | val_loss: 21.2033
epoch: 24/951 | step: 1725/6480 | trn_loss: 20.1870 | val_loss: 22.2991
epoch: 24/951 | step: 1740/6480 | trn_loss: 20.0002 | val_loss: 21.8120
epoch: 24/951 | step: 1755/6480 | trn_loss: 21.6419 | val_loss: 

epoch: 24/951 | step: 3255/6480 | trn_loss: 21.4871 | val_loss: 22.7725
epoch: 24/951 | step: 3270/6480 | trn_loss: 21.0676 | val_loss: 22.2302
epoch: 24/951 | step: 3285/6480 | trn_loss: 20.9620 | val_loss: 21.0109
epoch: 24/951 | step: 3300/6480 | trn_loss: 20.9849 | val_loss: 22.4509
epoch: 24/951 | step: 3315/6480 | trn_loss: 21.0522 | val_loss: 22.0541
epoch: 24/951 | step: 3330/6480 | trn_loss: 20.8524 | val_loss: 24.4950
epoch: 24/951 | step: 3345/6480 | trn_loss: 20.6961 | val_loss: 21.3978
epoch: 24/951 | step: 3360/6480 | trn_loss: 21.1160 | val_loss: 22.1258
epoch: 24/951 | step: 3375/6480 | trn_loss: 20.7189 | val_loss: 22.3976
epoch: 24/951 | step: 3390/6480 | trn_loss: 21.1383 | val_loss: 21.7864
epoch: 24/951 | step: 3405/6480 | trn_loss: 21.4180 | val_loss: 25.8453
epoch: 24/951 | step: 3420/6480 | trn_loss: 21.1442 | val_loss: 21.2723
epoch: 24/951 | step: 3435/6480 | trn_loss: 20.1544 | val_loss: 22.6114
epoch: 24/951 | step: 3450/6480 | trn_loss: 20.9946 | val_loss: 

epoch: 24/951 | step: 4950/6480 | trn_loss: 21.0894 | val_loss: 21.9408
epoch: 24/951 | step: 4965/6480 | trn_loss: 20.1199 | val_loss: 21.9454
epoch: 24/951 | step: 4980/6480 | trn_loss: 22.0235 | val_loss: 21.4324
epoch: 24/951 | step: 4995/6480 | trn_loss: 21.4312 | val_loss: 22.6615
epoch: 24/951 | step: 5010/6480 | trn_loss: 22.0071 | val_loss: 22.3942
epoch: 24/951 | step: 5025/6480 | trn_loss: 20.7662 | val_loss: 21.1091
epoch: 24/951 | step: 5040/6480 | trn_loss: 21.3646 | val_loss: 21.9868
epoch: 24/951 | step: 5055/6480 | trn_loss: 20.4868 | val_loss: 21.8673
epoch: 24/951 | step: 5070/6480 | trn_loss: 22.6616 | val_loss: 22.0355
epoch: 24/951 | step: 5085/6480 | trn_loss: 21.1691 | val_loss: 21.8248
epoch: 24/951 | step: 5100/6480 | trn_loss: 20.6128 | val_loss: 22.6175
epoch: 24/951 | step: 5115/6480 | trn_loss: 20.5806 | val_loss: 21.4116
epoch: 24/951 | step: 5130/6480 | trn_loss: 21.1482 | val_loss: 22.6138
epoch: 24/951 | step: 5145/6480 | trn_loss: 21.6419 | val_loss: 

epoch: 25/951 | step: 180/6480 | trn_loss: 21.3768 | val_loss: 20.7353
epoch: 25/951 | step: 195/6480 | trn_loss: 20.8624 | val_loss: 20.9846
epoch: 25/951 | step: 210/6480 | trn_loss: 20.9408 | val_loss: 22.2304
epoch: 25/951 | step: 225/6480 | trn_loss: 20.7541 | val_loss: 21.5364
epoch: 25/951 | step: 240/6480 | trn_loss: 20.6508 | val_loss: 22.4173
epoch: 25/951 | step: 255/6480 | trn_loss: 20.9845 | val_loss: 21.9253
epoch: 25/951 | step: 270/6480 | trn_loss: 20.6775 | val_loss: 21.9143
epoch: 25/951 | step: 285/6480 | trn_loss: 21.1929 | val_loss: 22.1270
epoch: 25/951 | step: 300/6480 | trn_loss: 20.9471 | val_loss: 21.2662
epoch: 25/951 | step: 315/6480 | trn_loss: 21.0506 | val_loss: 21.7229
epoch: 25/951 | step: 330/6480 | trn_loss: 21.2808 | val_loss: 23.9894
epoch: 25/951 | step: 345/6480 | trn_loss: 21.2639 | val_loss: 21.2628
epoch: 25/951 | step: 360/6480 | trn_loss: 20.5561 | val_loss: 21.4085
epoch: 25/951 | step: 375/6480 | trn_loss: 20.7148 | val_loss: 21.4844
epoch:

epoch: 25/951 | step: 1890/6480 | trn_loss: 21.2709 | val_loss: 21.0760
epoch: 25/951 | step: 1905/6480 | trn_loss: 20.5829 | val_loss: 21.4055
epoch: 25/951 | step: 1920/6480 | trn_loss: 21.8964 | val_loss: 22.4339
epoch: 25/951 | step: 1935/6480 | trn_loss: 21.2548 | val_loss: 23.0488
epoch: 25/951 | step: 1950/6480 | trn_loss: 21.2763 | val_loss: 21.9967
epoch: 25/951 | step: 1965/6480 | trn_loss: 20.6037 | val_loss: 22.5173
epoch: 25/951 | step: 1980/6480 | trn_loss: 20.8762 | val_loss: 21.8009
epoch: 25/951 | step: 1995/6480 | trn_loss: 20.6134 | val_loss: 22.6384
epoch: 25/951 | step: 2010/6480 | trn_loss: 21.0825 | val_loss: 20.7352
epoch: 25/951 | step: 2025/6480 | trn_loss: 21.2269 | val_loss: 21.9029
epoch: 25/951 | step: 2040/6480 | trn_loss: 20.6947 | val_loss: 21.2438
epoch: 25/951 | step: 2055/6480 | trn_loss: 20.8737 | val_loss: 21.9088
epoch: 25/951 | step: 2070/6480 | trn_loss: 20.5869 | val_loss: 21.5197
epoch: 25/951 | step: 2085/6480 | trn_loss: 20.3220 | val_loss: 

epoch: 25/951 | step: 3585/6480 | trn_loss: 21.1810 | val_loss: 22.1202
epoch: 25/951 | step: 3600/6480 | trn_loss: 20.9066 | val_loss: 20.9429
epoch: 25/951 | step: 3615/6480 | trn_loss: 20.7351 | val_loss: 20.8384
epoch: 25/951 | step: 3630/6480 | trn_loss: 20.3340 | val_loss: 21.3253
epoch: 25/951 | step: 3645/6480 | trn_loss: 21.4448 | val_loss: 21.1533
epoch: 25/951 | step: 3660/6480 | trn_loss: 21.5348 | val_loss: 23.1979
epoch: 25/951 | step: 3675/6480 | trn_loss: 20.9301 | val_loss: 21.5614
epoch: 25/951 | step: 3690/6480 | trn_loss: 20.0222 | val_loss: 21.2476
epoch: 25/951 | step: 3705/6480 | trn_loss: 20.3696 | val_loss: 21.2936
epoch: 25/951 | step: 3720/6480 | trn_loss: 21.7645 | val_loss: 22.8242
epoch: 25/951 | step: 3735/6480 | trn_loss: 20.8697 | val_loss: 20.9156
epoch: 25/951 | step: 3750/6480 | trn_loss: 20.4621 | val_loss: 21.7498
epoch: 25/951 | step: 3765/6480 | trn_loss: 20.9225 | val_loss: 21.3807
epoch: 25/951 | step: 3780/6480 | trn_loss: 21.4335 | val_loss: 

epoch: 25/951 | step: 5280/6480 | trn_loss: 21.4833 | val_loss: 21.3463
epoch: 25/951 | step: 5295/6480 | trn_loss: 20.4364 | val_loss: 21.2106
epoch: 25/951 | step: 5310/6480 | trn_loss: 20.6722 | val_loss: 21.2717
epoch: 25/951 | step: 5325/6480 | trn_loss: 22.2750 | val_loss: 22.9679
epoch: 25/951 | step: 5340/6480 | trn_loss: 20.6657 | val_loss: 22.0932
epoch: 25/951 | step: 5355/6480 | trn_loss: 21.3453 | val_loss: 20.5138
epoch: 25/951 | step: 5370/6480 | trn_loss: 20.8234 | val_loss: 22.5662
epoch: 25/951 | step: 5385/6480 | trn_loss: 23.0864 | val_loss: 22.6491
epoch: 25/951 | step: 5400/6480 | trn_loss: 22.8486 | val_loss: 21.6240
epoch: 25/951 | step: 5415/6480 | trn_loss: 20.5774 | val_loss: 21.4836
epoch: 25/951 | step: 5430/6480 | trn_loss: 20.4688 | val_loss: 21.6084
epoch: 25/951 | step: 5445/6480 | trn_loss: 20.5209 | val_loss: 21.2297
epoch: 25/951 | step: 5460/6480 | trn_loss: 20.3992 | val_loss: 21.5778
epoch: 25/951 | step: 5475/6480 | trn_loss: 21.0657 | val_loss: 

epoch: 26/951 | step: 510/6480 | trn_loss: 20.8641 | val_loss: 23.3815
epoch: 26/951 | step: 525/6480 | trn_loss: 21.0636 | val_loss: 23.2498
epoch: 26/951 | step: 540/6480 | trn_loss: 20.7665 | val_loss: 21.4346
epoch: 26/951 | step: 555/6480 | trn_loss: 20.9173 | val_loss: 21.8856
epoch: 26/951 | step: 570/6480 | trn_loss: 20.9390 | val_loss: 21.4419
epoch: 26/951 | step: 585/6480 | trn_loss: 20.6518 | val_loss: 20.9451
epoch: 26/951 | step: 600/6480 | trn_loss: 20.3387 | val_loss: 21.9228
epoch: 26/951 | step: 615/6480 | trn_loss: 20.9823 | val_loss: 22.6685
epoch: 26/951 | step: 630/6480 | trn_loss: 20.6849 | val_loss: 21.0779
epoch: 26/951 | step: 645/6480 | trn_loss: 21.2038 | val_loss: 22.7350
epoch: 26/951 | step: 660/6480 | trn_loss: 20.7862 | val_loss: 21.3433
epoch: 26/951 | step: 675/6480 | trn_loss: 20.7011 | val_loss: 21.0759
epoch: 26/951 | step: 690/6480 | trn_loss: 20.4192 | val_loss: 21.5342
epoch: 26/951 | step: 705/6480 | trn_loss: 20.3476 | val_loss: 21.0962
epoch:

epoch: 26/951 | step: 2220/6480 | trn_loss: 20.1496 | val_loss: 21.0868
epoch: 26/951 | step: 2235/6480 | trn_loss: 20.3752 | val_loss: 21.9921
epoch: 26/951 | step: 2250/6480 | trn_loss: 20.5102 | val_loss: 21.6717
epoch: 26/951 | step: 2265/6480 | trn_loss: 19.9239 | val_loss: 20.1204
epoch: 26/951 | step: 2280/6480 | trn_loss: 22.4013 | val_loss: 22.4232
epoch: 26/951 | step: 2295/6480 | trn_loss: 20.8987 | val_loss: 21.2767
epoch: 26/951 | step: 2310/6480 | trn_loss: 20.9417 | val_loss: 21.5519
epoch: 26/951 | step: 2325/6480 | trn_loss: 20.9473 | val_loss: 21.8148
epoch: 26/951 | step: 2340/6480 | trn_loss: 20.8338 | val_loss: 21.9780
epoch: 26/951 | step: 2355/6480 | trn_loss: 20.7172 | val_loss: 22.6412
epoch: 26/951 | step: 2370/6480 | trn_loss: 20.3835 | val_loss: 20.9556
epoch: 26/951 | step: 2385/6480 | trn_loss: 20.7667 | val_loss: 22.5404
epoch: 26/951 | step: 2400/6480 | trn_loss: 21.5051 | val_loss: 22.6286
epoch: 26/951 | step: 2415/6480 | trn_loss: 20.8321 | val_loss: 

epoch: 26/951 | step: 3915/6480 | trn_loss: 20.5098 | val_loss: 21.3402
epoch: 26/951 | step: 3930/6480 | trn_loss: 19.8722 | val_loss: 23.3099
epoch: 26/951 | step: 3945/6480 | trn_loss: 20.7336 | val_loss: 22.1309
epoch: 26/951 | step: 3960/6480 | trn_loss: 20.8702 | val_loss: 21.5849
epoch: 26/951 | step: 3975/6480 | trn_loss: 20.3486 | val_loss: 22.7022
epoch: 26/951 | step: 3990/6480 | trn_loss: 20.3229 | val_loss: 20.6954
epoch: 26/951 | step: 4005/6480 | trn_loss: 20.3361 | val_loss: 21.1989
epoch: 26/951 | step: 4020/6480 | trn_loss: 20.1489 | val_loss: 21.6225
epoch: 26/951 | step: 4035/6480 | trn_loss: 20.7622 | val_loss: 21.2646
epoch: 26/951 | step: 4050/6480 | trn_loss: 20.8156 | val_loss: 23.0537
epoch: 26/951 | step: 4065/6480 | trn_loss: 20.7117 | val_loss: 20.9906
epoch: 26/951 | step: 4080/6480 | trn_loss: 20.1799 | val_loss: 21.7268
epoch: 26/951 | step: 4095/6480 | trn_loss: 20.6795 | val_loss: 21.9463
epoch: 26/951 | step: 4110/6480 | trn_loss: 19.6808 | val_loss: 

epoch: 26/951 | step: 5610/6480 | trn_loss: 21.5791 | val_loss: 21.7348
epoch: 26/951 | step: 5625/6480 | trn_loss: 19.8737 | val_loss: 22.1112
epoch: 26/951 | step: 5640/6480 | trn_loss: 20.1087 | val_loss: 22.0912
epoch: 26/951 | step: 5655/6480 | trn_loss: 20.7564 | val_loss: 22.1541
epoch: 26/951 | step: 5670/6480 | trn_loss: 20.5196 | val_loss: 22.2988
epoch: 26/951 | step: 5685/6480 | trn_loss: 20.5484 | val_loss: 21.0859
epoch: 26/951 | step: 5700/6480 | trn_loss: 21.1475 | val_loss: 22.1053
epoch: 26/951 | step: 5715/6480 | trn_loss: 20.6181 | val_loss: 22.0406
epoch: 26/951 | step: 5730/6480 | trn_loss: 20.3926 | val_loss: 21.0095
epoch: 26/951 | step: 5745/6480 | trn_loss: 20.1818 | val_loss: 21.8939
epoch: 26/951 | step: 5760/6480 | trn_loss: 20.2338 | val_loss: 21.5874
epoch: 26/951 | step: 5775/6480 | trn_loss: 20.7681 | val_loss: 21.9471
epoch: 26/951 | step: 5790/6480 | trn_loss: 20.4959 | val_loss: 20.9632
epoch: 26/951 | step: 5805/6480 | trn_loss: 21.2951 | val_loss: 

epoch: 27/951 | step: 840/6480 | trn_loss: 20.6475 | val_loss: 22.3506
epoch: 27/951 | step: 855/6480 | trn_loss: 21.4023 | val_loss: 21.9830
epoch: 27/951 | step: 870/6480 | trn_loss: 20.2622 | val_loss: 21.5519
epoch: 27/951 | step: 885/6480 | trn_loss: 21.1630 | val_loss: 21.3471
epoch: 27/951 | step: 900/6480 | trn_loss: 19.8772 | val_loss: 20.6511
epoch: 27/951 | step: 915/6480 | trn_loss: 20.9486 | val_loss: 21.6003
epoch: 27/951 | step: 930/6480 | trn_loss: 21.3779 | val_loss: 21.6856
epoch: 27/951 | step: 945/6480 | trn_loss: 20.3983 | val_loss: 20.4426
epoch: 27/951 | step: 960/6480 | trn_loss: 20.4342 | val_loss: 21.2833
epoch: 27/951 | step: 975/6480 | trn_loss: 20.1517 | val_loss: 21.9528
epoch: 27/951 | step: 990/6480 | trn_loss: 21.5082 | val_loss: 21.6778
epoch: 27/951 | step: 1005/6480 | trn_loss: 21.2299 | val_loss: 22.2404
epoch: 27/951 | step: 1020/6480 | trn_loss: 20.5070 | val_loss: 21.5200
epoch: 27/951 | step: 1035/6480 | trn_loss: 20.4824 | val_loss: 22.6277
epo

epoch: 27/951 | step: 2535/6480 | trn_loss: 20.3308 | val_loss: 21.7269
epoch: 27/951 | step: 2550/6480 | trn_loss: 20.4959 | val_loss: 21.0725
epoch: 27/951 | step: 2565/6480 | trn_loss: 23.2454 | val_loss: 22.2072
epoch: 27/951 | step: 2580/6480 | trn_loss: 21.1356 | val_loss: 20.9840
epoch: 27/951 | step: 2595/6480 | trn_loss: 20.1034 | val_loss: 22.6099
epoch: 27/951 | step: 2610/6480 | trn_loss: 20.1751 | val_loss: 21.0684
epoch: 27/951 | step: 2625/6480 | trn_loss: 19.7243 | val_loss: 21.2225
epoch: 27/951 | step: 2640/6480 | trn_loss: 20.2160 | val_loss: 21.9484
epoch: 27/951 | step: 2655/6480 | trn_loss: 20.0601 | val_loss: 21.8222
epoch: 27/951 | step: 2670/6480 | trn_loss: 20.1376 | val_loss: 21.5577
epoch: 27/951 | step: 2685/6480 | trn_loss: 20.2212 | val_loss: 21.8133
epoch: 27/951 | step: 2700/6480 | trn_loss: 20.4167 | val_loss: 21.2578
epoch: 27/951 | step: 2715/6480 | trn_loss: 20.1688 | val_loss: 21.7270
epoch: 27/951 | step: 2730/6480 | trn_loss: 20.0472 | val_loss: 

epoch: 27/951 | step: 4230/6480 | trn_loss: 20.4761 | val_loss: 21.9504
epoch: 27/951 | step: 4245/6480 | trn_loss: 20.2114 | val_loss: 21.3982
epoch: 27/951 | step: 4260/6480 | trn_loss: 20.7497 | val_loss: 22.0146
epoch: 27/951 | step: 4275/6480 | trn_loss: 20.5471 | val_loss: 21.3225
epoch: 27/951 | step: 4290/6480 | trn_loss: 20.4323 | val_loss: 20.2768
epoch: 27/951 | step: 4305/6480 | trn_loss: 19.9903 | val_loss: 22.5599
epoch: 27/951 | step: 4320/6480 | trn_loss: 20.7289 | val_loss: 22.1430
epoch: 27/951 | step: 4335/6480 | trn_loss: 21.1716 | val_loss: 21.9245
epoch: 27/951 | step: 4350/6480 | trn_loss: 20.3912 | val_loss: 21.8245
epoch: 27/951 | step: 4365/6480 | trn_loss: 20.2843 | val_loss: 21.7398
epoch: 27/951 | step: 4380/6480 | trn_loss: 20.5868 | val_loss: 21.5937
epoch: 27/951 | step: 4395/6480 | trn_loss: 20.9995 | val_loss: 21.9719
epoch: 27/951 | step: 4410/6480 | trn_loss: 20.4919 | val_loss: 21.0059
epoch: 27/951 | step: 4425/6480 | trn_loss: 21.1535 | val_loss: 

epoch: 27/951 | step: 5925/6480 | trn_loss: 21.0588 | val_loss: 21.8729
epoch: 27/951 | step: 5940/6480 | trn_loss: 21.4280 | val_loss: 22.3454
epoch: 27/951 | step: 5955/6480 | trn_loss: 19.9672 | val_loss: 21.5757
epoch: 27/951 | step: 5970/6480 | trn_loss: 20.6303 | val_loss: 21.3950
epoch: 27/951 | step: 5985/6480 | trn_loss: 20.3844 | val_loss: 22.0650
epoch: 27/951 | step: 6000/6480 | trn_loss: 20.3859 | val_loss: 21.1953
epoch: 27/951 | step: 6015/6480 | trn_loss: 20.1759 | val_loss: 20.8903
epoch: 27/951 | step: 6030/6480 | trn_loss: 20.2339 | val_loss: 21.0689
epoch: 27/951 | step: 6045/6480 | trn_loss: 20.5505 | val_loss: 21.4318
epoch: 27/951 | step: 6060/6480 | trn_loss: 20.3355 | val_loss: 22.1714
epoch: 27/951 | step: 6075/6480 | trn_loss: 21.4899 | val_loss: 22.1549
epoch: 27/951 | step: 6090/6480 | trn_loss: 21.3062 | val_loss: 20.9912
epoch: 27/951 | step: 6105/6480 | trn_loss: 21.0085 | val_loss: 22.5853
epoch: 27/951 | step: 6120/6480 | trn_loss: 20.3403 | val_loss: 

epoch: 28/951 | step: 1155/6480 | trn_loss: 20.6274 | val_loss: 21.9976
epoch: 28/951 | step: 1170/6480 | trn_loss: 21.3357 | val_loss: 22.3550
epoch: 28/951 | step: 1185/6480 | trn_loss: 20.6630 | val_loss: 21.0579
epoch: 28/951 | step: 1200/6480 | trn_loss: 20.3107 | val_loss: 23.0966
epoch: 28/951 | step: 1215/6480 | trn_loss: 21.0219 | val_loss: 21.5527
epoch: 28/951 | step: 1230/6480 | trn_loss: 20.9876 | val_loss: 22.0637
epoch: 28/951 | step: 1245/6480 | trn_loss: 20.5722 | val_loss: 21.5267
epoch: 28/951 | step: 1260/6480 | trn_loss: 20.4600 | val_loss: 21.4696
epoch: 28/951 | step: 1275/6480 | trn_loss: 20.3845 | val_loss: 21.4038
epoch: 28/951 | step: 1290/6480 | trn_loss: 20.2487 | val_loss: 21.6613
epoch: 28/951 | step: 1305/6480 | trn_loss: 20.4118 | val_loss: 22.0355
epoch: 28/951 | step: 1320/6480 | trn_loss: 20.7601 | val_loss: 21.5539
epoch: 28/951 | step: 1335/6480 | trn_loss: 20.5166 | val_loss: 21.7024
epoch: 28/951 | step: 1350/6480 | trn_loss: 19.9791 | val_loss: 

epoch: 28/951 | step: 2850/6480 | trn_loss: 20.3093 | val_loss: 21.2164
epoch: 28/951 | step: 2865/6480 | trn_loss: 20.1345 | val_loss: 21.0846
epoch: 28/951 | step: 2880/6480 | trn_loss: 20.4324 | val_loss: 20.8699
epoch: 28/951 | step: 2895/6480 | trn_loss: 19.9541 | val_loss: 20.7965
epoch: 28/951 | step: 2910/6480 | trn_loss: 19.6927 | val_loss: 21.2854
epoch: 28/951 | step: 2925/6480 | trn_loss: 20.9719 | val_loss: 21.5990
epoch: 28/951 | step: 2940/6480 | trn_loss: 20.4374 | val_loss: 21.4169
epoch: 28/951 | step: 2955/6480 | trn_loss: 19.2733 | val_loss: 21.1491
epoch: 28/951 | step: 2970/6480 | trn_loss: 19.6626 | val_loss: 20.9970
epoch: 28/951 | step: 2985/6480 | trn_loss: 20.2866 | val_loss: 20.2828
epoch: 28/951 | step: 3000/6480 | trn_loss: 20.4103 | val_loss: 21.6022
epoch: 28/951 | step: 3015/6480 | trn_loss: 20.5916 | val_loss: 21.1286
epoch: 28/951 | step: 3030/6480 | trn_loss: 21.0148 | val_loss: 21.5083
epoch: 28/951 | step: 3045/6480 | trn_loss: 20.5520 | val_loss: 

epoch: 28/951 | step: 4545/6480 | trn_loss: 20.0152 | val_loss: 21.0799
epoch: 28/951 | step: 4560/6480 | trn_loss: 20.9986 | val_loss: 21.0320
epoch: 28/951 | step: 4575/6480 | trn_loss: 20.1909 | val_loss: 21.5453
epoch: 28/951 | step: 4590/6480 | trn_loss: 20.2491 | val_loss: 21.7005
epoch: 28/951 | step: 4605/6480 | trn_loss: 22.0364 | val_loss: 21.6630
epoch: 28/951 | step: 4620/6480 | trn_loss: 20.4998 | val_loss: 21.2995
epoch: 28/951 | step: 4635/6480 | trn_loss: 20.2649 | val_loss: 21.1706
epoch: 28/951 | step: 4650/6480 | trn_loss: 20.4737 | val_loss: 21.9543
epoch: 28/951 | step: 4665/6480 | trn_loss: 20.4056 | val_loss: 20.8582
epoch: 28/951 | step: 4680/6480 | trn_loss: 19.8003 | val_loss: 20.4103
epoch: 28/951 | step: 4695/6480 | trn_loss: 20.1114 | val_loss: 20.8502
epoch: 28/951 | step: 4710/6480 | trn_loss: 21.3291 | val_loss: 21.3864
epoch: 28/951 | step: 4725/6480 | trn_loss: 20.7417 | val_loss: 21.6193
epoch: 28/951 | step: 4740/6480 | trn_loss: 20.0597 | val_loss: 

epoch: 28/951 | step: 6240/6480 | trn_loss: 20.0487 | val_loss: 20.6757
epoch: 28/951 | step: 6255/6480 | trn_loss: 20.1924 | val_loss: 20.4347
epoch: 28/951 | step: 6270/6480 | trn_loss: 19.8351 | val_loss: 21.6140
epoch: 28/951 | step: 6285/6480 | trn_loss: 20.4594 | val_loss: 27.0799
epoch: 28/951 | step: 6300/6480 | trn_loss: 21.5312 | val_loss: 21.6706
epoch: 28/951 | step: 6315/6480 | trn_loss: 20.3324 | val_loss: 21.9749
epoch: 28/951 | step: 6330/6480 | trn_loss: 20.5346 | val_loss: 20.5602
epoch: 28/951 | step: 6345/6480 | trn_loss: 20.4053 | val_loss: 21.9004
epoch: 28/951 | step: 6360/6480 | trn_loss: 20.5094 | val_loss: 21.4846
epoch: 28/951 | step: 6375/6480 | trn_loss: 19.9297 | val_loss: 21.8155
epoch: 28/951 | step: 6390/6480 | trn_loss: 20.9420 | val_loss: 22.0321
epoch: 28/951 | step: 6405/6480 | trn_loss: 20.7788 | val_loss: 21.9473
epoch: 28/951 | step: 6420/6480 | trn_loss: 20.9087 | val_loss: 27.7315
epoch: 28/951 | step: 6435/6480 | trn_loss: 20.9657 | val_loss: 

In [None]:
val_pred

In [None]:
val_y

In [None]:
trn_pred = model(trn_X.float())

In [None]:
trn_loss = mae(trn_pred.double(), trn_y.double())

In [None]:
plt.figure(figsize=(16,9))
x_range = range(len(trn_loss_list))
plt.plot(x_range, trn_loss_list, label="trn")
plt.plot(x_range, val_loss_list, label="val")
plt.legend()
plt.xlabel("training steps")
plt.ylabel("loss")