 <h1 style="text-align:center">最终结果</h1>
 <img src="result.png" style="width: 200px;">

In [334]:
# Numerical Operations
import math
import numpy as np

# Reading/Writing Data
import pandas as pd
import os
import csv

# For Progress Bar
from tqdm import tqdm

# Pytorch
import torch 
import torch.nn as nn
from torch.utils.data import Dataset, DataLoader, random_split

# For plotting learning curve
from torch.utils.tensorboard import SummaryWriter

In [335]:
def same_seed(seed): 
    '''Fixes random number generator seeds for reproducibility.'''
    torch.backends.cudnn.deterministic = True
    torch.backends.cudnn.benchmark = False
    np.random.seed(seed)
    torch.manual_seed(seed)
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(seed)

def train_valid_split(data_set, valid_ratio, seed):
    '''Split provided training data into training set and validation set'''
    valid_set_size = int(valid_ratio * len(data_set)) 
    train_set_size = len(data_set) - valid_set_size
    train_set, valid_set = random_split(data_set, [train_set_size, valid_set_size], generator=torch.Generator().manual_seed(seed))
    return np.array(train_set), np.array(valid_set)

def predict(test_loader, model, device):
    model.eval() # Set your model to evaluation mode.
    preds = []
    for x in tqdm(test_loader):
        x = x.to(device)                        
        with torch.no_grad():                   
            pred = model(x)                     
            preds.append(pred.detach().cpu())   
    preds = torch.cat(preds, dim=0).numpy()  
    return preds

In [336]:
class COVID19Dataset(Dataset):
    '''
    x: Features.
    y: Targets, if none, do prediction.
    '''
    def __init__(self, x, y=None):
        if y is None:
            self.y = y
        else:
            self.y = torch.FloatTensor(y)
        self.x = torch.FloatTensor(x)

    def __getitem__(self, idx):
        if self.y is None:
            return self.x[idx]
        else:
            return self.x[idx], self.y[idx]

    def __len__(self):
        return len(self.x)

In [337]:
class My_Model(nn.Module):
    def __init__(self, input_dim):
        super(My_Model, self).__init__()
        # TODO: modify model's structure, be aware of dimensions. 
        self.layers = nn.Sequential(
            nn.Linear(input_dim, 16),
            nn.ReLU(),
            nn.Linear(16, 8),
            nn.ReLU(),
            nn.Linear(8, 1)
        )
        self.criterion = nn.MSELoss(reduction='mean')

    def forward(self, x):
        x = self.layers(x)
        x = x.squeeze(1) # (B, 1) -> (B)
        return x
    def cal_loss(self,pred,target):
        return torch.sqrt(self.criterion(pred,target))

In [338]:
def select_feat(train_data, valid_data, test_data, select_all=True):
    '''Selects useful features to perform regression'''
    y_train, y_valid = train_data[:,-1], valid_data[:,-1]
    raw_x_train, raw_x_valid, raw_x_test = train_data[:,:-1], valid_data[:,:-1], test_data
    x = pd.read_csv('./covid.train.csv')
    y = pd.read_csv('./covid.test.csv')

    best_corr = x.corr()['tested_positive.4'].sort_values(ascending=False)[abs(x.corr()['tested_positive.4'].sort_values(ascending=False))>0.86].index[1:]
    idx = 0
    res_list = []
    for i in x.columns:
        if i in best_corr :
            res_list.append(idx)
        idx = idx+1
    feat_idx = res_list
    print(select_all)

    if select_all:
        feat_idx = list(range(raw_x_train.shape[1]))
    else:
        feat_idx = res_list # TODO: Select suitable feature columns.
        print(feat_idx)
        
    return raw_x_train[:,feat_idx], raw_x_valid[:,feat_idx], raw_x_test[:,feat_idx], y_train, y_valid

In [339]:
def trainer(train_loader, valid_loader, model, config, device):

    #criterion = nn.MSELoss(reduction='mean') # Define your loss function, do not modify this.

    # Define your optimization algorithm. 
    # TODO: Please check https://pytorch.org/docs/stable/optim.html to get more available algorithms.
    # TODO: L2 regularization (optimizer(weight decay...) or implement by your self).
    optimizer = torch.optim.Adam(model.parameters(), lr=config['learning_rate']) #momentum=0.9

    writer = SummaryWriter() # Writer of tensoboard.

    if not os.path.isdir('./models'):
        os.mkdir('./models') # Create directory of saving models.

    n_epochs, best_loss, step, early_stop_count = config['n_epochs'], math.inf, 0, 0

    for epoch in range(n_epochs):
        model.train() # Set your model to train mode.
        loss_record = []

        # tqdm is a package to visualize your training progress.
        train_pbar = tqdm(train_loader, position=0, leave=True)

        for x, y in train_pbar:
            optimizer.zero_grad()               # Set gradient to zero.
            x, y = x.to(device), y.to(device)   # Move your data to device. 
            pred = model(x)             
            loss = model.cal_loss(pred, y)
            loss.backward()                     # Compute gradient(backpropagation).
            optimizer.step()                    # Update parameters.
            step += 1
            loss_record.append(loss.detach().item())
            
            # Display current epoch number and loss on tqdm progress bar.
            train_pbar.set_description(f'Epoch [{epoch+1}/{n_epochs}]')
            train_pbar.set_postfix({'loss': loss.detach().item()})

        mean_train_loss = sum(loss_record)/len(loss_record)
        writer.add_scalar('Loss/train', mean_train_loss, step)

        model.eval() # Set your model to evaluation mode.
        loss_record = []
        for x, y in valid_loader:
            x, y = x.to(device), y.to(device)
            with torch.no_grad():
                pred = model(x)
                loss = model.cal_loss(pred, y)

            loss_record.append(loss.item())
            
        mean_valid_loss = sum(loss_record)/len(loss_record)
        print(f'Epoch [{epoch+1}/{n_epochs}]: Train loss: {mean_train_loss:.4f}, Valid loss: {mean_valid_loss:.4f}')
        writer.add_scalar('Loss/valid', mean_valid_loss, step)

        if mean_valid_loss < best_loss:
            best_loss = mean_valid_loss
            torch.save(model.state_dict(), config['save_path']) # Save your best model
            print('Saving model with loss {:.3f}...'.format(best_loss))
            early_stop_count = 0
        else: 
            early_stop_count += 1

        if early_stop_count >= config['early_stop']:
            print('\nModel is not improving, so we halt the training session.')
            return

In [340]:
device = 'cuda' if torch.cuda.is_available() else 'cpu'
config = {
    'seed': 5201314,      # Your seed number, you can pick your lucky number. :)
    'select_all': True,   # Whether to use all features.
    'valid_ratio': 0.01,   # validation_size = train_size * valid_ratio
    'n_epochs': 5000,     # Number of epochs.            
    'batch_size': 200, 
    'learning_rate': 1e-3,              
    'early_stop': 500,    # If model has not improved for this many consecutive epochs, stop training.     
    'save_path': './models/model.ckpt'  # Your model will be saved here.
}

In [341]:
# Set seed for reproducibility
same_seed(config['seed'])


# train_data size: 2699 x 118 (id + 37 states + 16 features x 5 days) 
# test_data size: 1078 x 117 (without last day's positive rate)
train_data, test_data = pd.read_csv('./covid.train.csv').values, pd.read_csv('./covid.test.csv').values
train_data, valid_data = train_valid_split(train_data, config['valid_ratio'], config['seed'])

# Print out the data size.
print(f"""train_data size: {train_data.shape} 
valid_data size: {valid_data.shape} 
test_data size: {test_data.shape}""")

# Select features
x_train, x_valid, x_test, y_train, y_valid = select_feat(train_data, valid_data, test_data, False)

# Print out the number of features.
print(f'number of features: {x_train.shape[1]}')

train_dataset, valid_dataset, test_dataset = COVID19Dataset(x_train, y_train), \
                                            COVID19Dataset(x_valid, y_valid), \
                                            COVID19Dataset(x_test)

# Pytorch data loader loads pytorch dataset into batches.
train_loader = DataLoader(train_dataset, batch_size=config['batch_size'], shuffle=True, pin_memory=True)
valid_loader = DataLoader(valid_dataset, batch_size=config['batch_size'], shuffle=True, pin_memory=True)
test_loader = DataLoader(test_dataset, batch_size=config['batch_size'], shuffle=False, pin_memory=True)

train_data size: (2673, 118) 
valid_data size: (26, 118) 
test_data size: (1078, 117)
False
[40, 41, 53, 56, 57, 69, 72, 73, 85, 87, 88, 89, 101, 102, 103, 104, 105]
number of features: 17


In [342]:
model = My_Model(input_dim=x_train.shape[1]).to(device) # put your model and data on the same computation device.
trainer(train_loader, valid_loader, model, config, device)

Epoch [1/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.08it/s, loss=5.3]


Epoch [1/5000]: Train loss: 7.6270, Valid loss: 4.2862
Saving model with loss 4.286...


Epoch [2/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.85it/s, loss=2.98]


Epoch [2/5000]: Train loss: 4.0894, Valid loss: 2.2300
Saving model with loss 2.230...


Epoch [3/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.01it/s, loss=2.57]


Epoch [3/5000]: Train loss: 2.6734, Valid loss: 2.8301


Epoch [4/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.74it/s, loss=2.4]


Epoch [4/5000]: Train loss: 2.5390, Valid loss: 2.2442


Epoch [5/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.45it/s, loss=2.72]


Epoch [5/5000]: Train loss: 2.4833, Valid loss: 2.3349


Epoch [6/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.82it/s, loss=2.72]


Epoch [6/5000]: Train loss: 2.4417, Valid loss: 2.3139


Epoch [7/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.15it/s, loss=2.25]


Epoch [7/5000]: Train loss: 2.3929, Valid loss: 2.3010


Epoch [8/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.44it/s, loss=2.39]


Epoch [8/5000]: Train loss: 2.3656, Valid loss: 2.2639


Epoch [9/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.77it/s, loss=2.5]


Epoch [9/5000]: Train loss: 2.3415, Valid loss: 2.2245
Saving model with loss 2.224...


Epoch [10/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.32it/s, loss=2.42]


Epoch [10/5000]: Train loss: 2.3041, Valid loss: 2.2066
Saving model with loss 2.207...


Epoch [11/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.83it/s, loss=1.96]


Epoch [11/5000]: Train loss: 2.2483, Valid loss: 2.1874
Saving model with loss 2.187...


Epoch [12/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.79it/s, loss=1.84]


Epoch [12/5000]: Train loss: 2.2023, Valid loss: 2.1719
Saving model with loss 2.172...


Epoch [13/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.08it/s, loss=2.52]


Epoch [13/5000]: Train loss: 2.1934, Valid loss: 2.1238
Saving model with loss 2.124...


Epoch [14/5000]: 100%|██████████| 14/14 [00:00<00:00, 168.06it/s, loss=1.72]


Epoch [14/5000]: Train loss: 2.1167, Valid loss: 2.1016
Saving model with loss 2.102...


Epoch [15/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.24it/s, loss=2.04]


Epoch [15/5000]: Train loss: 2.0902, Valid loss: 2.0327
Saving model with loss 2.033...


Epoch [16/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.22it/s, loss=2.22]


Epoch [16/5000]: Train loss: 2.0593, Valid loss: 2.0193
Saving model with loss 2.019...


Epoch [17/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.29it/s, loss=2.29]


Epoch [17/5000]: Train loss: 2.0060, Valid loss: 1.9792
Saving model with loss 1.979...


Epoch [18/5000]: 100%|██████████| 14/14 [00:00<00:00, 152.19it/s, loss=2.12]


Epoch [18/5000]: Train loss: 1.9506, Valid loss: 1.9297
Saving model with loss 1.930...


Epoch [19/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.03it/s, loss=1.82]


Epoch [19/5000]: Train loss: 1.8821, Valid loss: 1.8094
Saving model with loss 1.809...


Epoch [20/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.39it/s, loss=1.73]


Epoch [20/5000]: Train loss: 1.8063, Valid loss: 1.7498
Saving model with loss 1.750...


Epoch [21/5000]: 100%|██████████| 14/14 [00:00<00:00, 169.48it/s, loss=1.71]


Epoch [21/5000]: Train loss: 1.7149, Valid loss: 1.7191
Saving model with loss 1.719...


Epoch [22/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.18it/s, loss=1.66]


Epoch [22/5000]: Train loss: 1.6206, Valid loss: 1.6347
Saving model with loss 1.635...


Epoch [23/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.93it/s, loss=1.5]


Epoch [23/5000]: Train loss: 1.5265, Valid loss: 1.5497
Saving model with loss 1.550...


Epoch [24/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.60it/s, loss=1.5]


Epoch [24/5000]: Train loss: 1.4694, Valid loss: 1.4568
Saving model with loss 1.457...


Epoch [25/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.88it/s, loss=1.66]


Epoch [25/5000]: Train loss: 1.4437, Valid loss: 1.5073


Epoch [26/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.50it/s, loss=1.41]


Epoch [26/5000]: Train loss: 1.4084, Valid loss: 1.3929
Saving model with loss 1.393...


Epoch [27/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.15it/s, loss=1.21]


Epoch [27/5000]: Train loss: 1.3709, Valid loss: 1.3685
Saving model with loss 1.369...


Epoch [28/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.00it/s, loss=1.21]


Epoch [28/5000]: Train loss: 1.3563, Valid loss: 1.4005


Epoch [29/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.59it/s, loss=1.19]


Epoch [29/5000]: Train loss: 1.3425, Valid loss: 1.3314
Saving model with loss 1.331...


Epoch [30/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.06it/s, loss=1.35]


Epoch [30/5000]: Train loss: 1.3395, Valid loss: 1.3077
Saving model with loss 1.308...


Epoch [31/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.71it/s, loss=1.32]


Epoch [31/5000]: Train loss: 1.3264, Valid loss: 1.3026
Saving model with loss 1.303...


Epoch [32/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.09it/s, loss=1.06]


Epoch [32/5000]: Train loss: 1.2990, Valid loss: 1.3481


Epoch [33/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.35it/s, loss=1.47]


Epoch [33/5000]: Train loss: 1.3076, Valid loss: 1.3417


Epoch [34/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.88it/s, loss=1.29]


Epoch [34/5000]: Train loss: 1.2978, Valid loss: 1.2758
Saving model with loss 1.276...


Epoch [35/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.69it/s, loss=1.3]


Epoch [35/5000]: Train loss: 1.2906, Valid loss: 1.2489
Saving model with loss 1.249...


Epoch [36/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.72it/s, loss=1.48]


Epoch [36/5000]: Train loss: 1.2754, Valid loss: 1.2463
Saving model with loss 1.246...


Epoch [37/5000]: 100%|██████████| 14/14 [00:00<00:00, 154.52it/s, loss=1.4]


Epoch [37/5000]: Train loss: 1.2626, Valid loss: 1.2512


Epoch [38/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.84it/s, loss=1.02]


Epoch [38/5000]: Train loss: 1.2370, Valid loss: 1.3042


Epoch [39/5000]: 100%|██████████| 14/14 [00:00<00:00, 147.20it/s, loss=1.34]


Epoch [39/5000]: Train loss: 1.2464, Valid loss: 1.2183
Saving model with loss 1.218...


Epoch [40/5000]: 100%|██████████| 14/14 [00:00<00:00, 169.89it/s, loss=1.34]


Epoch [40/5000]: Train loss: 1.2366, Valid loss: 1.2053
Saving model with loss 1.205...


Epoch [41/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.57it/s, loss=1.2]


Epoch [41/5000]: Train loss: 1.2199, Valid loss: 1.2011
Saving model with loss 1.201...


Epoch [42/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.04it/s, loss=1.04]


Epoch [42/5000]: Train loss: 1.2021, Valid loss: 1.2336


Epoch [43/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.14it/s, loss=1.03]


Epoch [43/5000]: Train loss: 1.2232, Valid loss: 1.1991
Saving model with loss 1.199...


Epoch [44/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.35it/s, loss=1.24]


Epoch [44/5000]: Train loss: 1.2201, Valid loss: 1.1867
Saving model with loss 1.187...


Epoch [45/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.71it/s, loss=1.07]


Epoch [45/5000]: Train loss: 1.2143, Valid loss: 1.1748
Saving model with loss 1.175...


Epoch [46/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.43it/s, loss=1.1]


Epoch [46/5000]: Train loss: 1.1925, Valid loss: 1.2229


Epoch [47/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.81it/s, loss=1.26]


Epoch [47/5000]: Train loss: 1.1885, Valid loss: 1.1553
Saving model with loss 1.155...


Epoch [48/5000]: 100%|██████████| 14/14 [00:00<00:00, 169.96it/s, loss=1.04]


Epoch [48/5000]: Train loss: 1.1685, Valid loss: 1.1476
Saving model with loss 1.148...


Epoch [49/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.56it/s, loss=1.36]


Epoch [49/5000]: Train loss: 1.1789, Valid loss: 1.1349
Saving model with loss 1.135...


Epoch [50/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.83it/s, loss=1.15]


Epoch [50/5000]: Train loss: 1.1615, Valid loss: 1.1436


Epoch [51/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.43it/s, loss=0.945]


Epoch [51/5000]: Train loss: 1.1500, Valid loss: 1.1776


Epoch [52/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.41it/s, loss=1.52]


Epoch [52/5000]: Train loss: 1.1766, Valid loss: 1.1536


Epoch [53/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.71it/s, loss=1.48]


Epoch [53/5000]: Train loss: 1.1748, Valid loss: 1.1149
Saving model with loss 1.115...


Epoch [54/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.72it/s, loss=1.24]


Epoch [54/5000]: Train loss: 1.1514, Valid loss: 1.1041
Saving model with loss 1.104...


Epoch [55/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.33it/s, loss=1.1]


Epoch [55/5000]: Train loss: 1.1462, Valid loss: 1.1008
Saving model with loss 1.101...


Epoch [56/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.14it/s, loss=1.12]


Epoch [56/5000]: Train loss: 1.1457, Valid loss: 1.1415


Epoch [57/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.78it/s, loss=1.12]


Epoch [57/5000]: Train loss: 1.1477, Valid loss: 1.0975
Saving model with loss 1.098...


Epoch [58/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.01it/s, loss=0.906]


Epoch [58/5000]: Train loss: 1.1287, Valid loss: 1.0961
Saving model with loss 1.096...


Epoch [59/5000]: 100%|██████████| 14/14 [00:00<00:00, 118.76it/s, loss=0.977]


Epoch [59/5000]: Train loss: 1.1437, Valid loss: 1.1010


Epoch [60/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.50it/s, loss=1.43]


Epoch [60/5000]: Train loss: 1.1428, Valid loss: 1.1288


Epoch [61/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.63it/s, loss=0.946]


Epoch [61/5000]: Train loss: 1.1291, Valid loss: 1.0777
Saving model with loss 1.078...


Epoch [62/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.73it/s, loss=1.04]


Epoch [62/5000]: Train loss: 1.1480, Valid loss: 1.0868


Epoch [63/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.25it/s, loss=1.25]


Epoch [63/5000]: Train loss: 1.1351, Valid loss: 1.0847


Epoch [64/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.70it/s, loss=1.05]


Epoch [64/5000]: Train loss: 1.1217, Valid loss: 1.0862


Epoch [65/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.64it/s, loss=1.11]


Epoch [65/5000]: Train loss: 1.1194, Valid loss: 1.0723
Saving model with loss 1.072...


Epoch [66/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.18it/s, loss=1.01]


Epoch [66/5000]: Train loss: 1.1172, Valid loss: 1.0769


Epoch [67/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.69it/s, loss=1.03]


Epoch [67/5000]: Train loss: 1.1111, Valid loss: 1.0816


Epoch [68/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.09it/s, loss=1.14]


Epoch [68/5000]: Train loss: 1.1237, Valid loss: 1.0611
Saving model with loss 1.061...


Epoch [69/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.58it/s, loss=1.15]


Epoch [69/5000]: Train loss: 1.1116, Valid loss: 1.0892


Epoch [70/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.33it/s, loss=1.32]


Epoch [70/5000]: Train loss: 1.1236, Valid loss: 1.0600
Saving model with loss 1.060...


Epoch [71/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.41it/s, loss=1.27]


Epoch [71/5000]: Train loss: 1.1434, Valid loss: 1.1008


Epoch [72/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.83it/s, loss=1.19]


Epoch [72/5000]: Train loss: 1.1410, Valid loss: 1.1041


Epoch [73/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.59it/s, loss=1.23]


Epoch [73/5000]: Train loss: 1.1288, Valid loss: 1.0456
Saving model with loss 1.046...


Epoch [74/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.45it/s, loss=0.943]


Epoch [74/5000]: Train loss: 1.1042, Valid loss: 1.0578


Epoch [75/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.15it/s, loss=0.856]


Epoch [75/5000]: Train loss: 1.0945, Valid loss: 1.0602


Epoch [76/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.94it/s, loss=1.33]


Epoch [76/5000]: Train loss: 1.1149, Valid loss: 1.0544


Epoch [77/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.21it/s, loss=1.01]


Epoch [77/5000]: Train loss: 1.0991, Valid loss: 1.0477


Epoch [78/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.39it/s, loss=1.13]


Epoch [78/5000]: Train loss: 1.1046, Valid loss: 1.0380
Saving model with loss 1.038...


Epoch [79/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.91it/s, loss=0.873]


Epoch [79/5000]: Train loss: 1.0852, Valid loss: 1.0416


Epoch [80/5000]: 100%|██████████| 14/14 [00:00<00:00, 152.44it/s, loss=0.942]


Epoch [80/5000]: Train loss: 1.0963, Valid loss: 1.0785


Epoch [81/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.72it/s, loss=0.962]


Epoch [81/5000]: Train loss: 1.0988, Valid loss: 1.0322
Saving model with loss 1.032...


Epoch [82/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.82it/s, loss=1.14]


Epoch [82/5000]: Train loss: 1.1230, Valid loss: 1.0401


Epoch [83/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.26it/s, loss=1.07]


Epoch [83/5000]: Train loss: 1.0988, Valid loss: 1.0956


Epoch [84/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.39it/s, loss=1]


Epoch [84/5000]: Train loss: 1.0961, Valid loss: 1.0435


Epoch [85/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.38it/s, loss=1.02]


Epoch [85/5000]: Train loss: 1.0889, Valid loss: 1.0279
Saving model with loss 1.028...


Epoch [86/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.44it/s, loss=1.11]


Epoch [86/5000]: Train loss: 1.1136, Valid loss: 1.0493


Epoch [87/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.30it/s, loss=1.07]


Epoch [87/5000]: Train loss: 1.0967, Valid loss: 1.0342


Epoch [88/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.59it/s, loss=1.03]


Epoch [88/5000]: Train loss: 1.0888, Valid loss: 1.0294


Epoch [89/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.24it/s, loss=1.04]


Epoch [89/5000]: Train loss: 1.0857, Valid loss: 1.0235
Saving model with loss 1.024...


Epoch [90/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.92it/s, loss=1.13]


Epoch [90/5000]: Train loss: 1.0914, Valid loss: 1.0254


Epoch [91/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.29it/s, loss=1.25]


Epoch [91/5000]: Train loss: 1.1035, Valid loss: 1.0800


Epoch [92/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.37it/s, loss=1.11]


Epoch [92/5000]: Train loss: 1.0942, Valid loss: 1.0167
Saving model with loss 1.017...


Epoch [93/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.75it/s, loss=1.04]


Epoch [93/5000]: Train loss: 1.0938, Valid loss: 1.0315


Epoch [94/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.63it/s, loss=0.99]


Epoch [94/5000]: Train loss: 1.0878, Valid loss: 1.1442


Epoch [95/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.91it/s, loss=1.42]


Epoch [95/5000]: Train loss: 1.1167, Valid loss: 1.0342


Epoch [96/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.94it/s, loss=0.992]


Epoch [96/5000]: Train loss: 1.0847, Valid loss: 1.0221


Epoch [97/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.07it/s, loss=1.02]


Epoch [97/5000]: Train loss: 1.0836, Valid loss: 1.0193


Epoch [98/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.66it/s, loss=1.07]


Epoch [98/5000]: Train loss: 1.0932, Valid loss: 1.0583


Epoch [99/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.28it/s, loss=1.09]


Epoch [99/5000]: Train loss: 1.1070, Valid loss: 1.0301


Epoch [100/5000]: 100%|██████████| 14/14 [00:00<00:00, 163.01it/s, loss=1.14]


Epoch [100/5000]: Train loss: 1.0903, Valid loss: 1.0404


Epoch [101/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.40it/s, loss=1.14]


Epoch [101/5000]: Train loss: 1.0841, Valid loss: 1.0177


Epoch [102/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.49it/s, loss=0.998]


Epoch [102/5000]: Train loss: 1.0800, Valid loss: 1.0130
Saving model with loss 1.013...


Epoch [103/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.72it/s, loss=1.05]


Epoch [103/5000]: Train loss: 1.1041, Valid loss: 1.0470


Epoch [104/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.90it/s, loss=1.11]


Epoch [104/5000]: Train loss: 1.0854, Valid loss: 1.0233


Epoch [105/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.98it/s, loss=1.24]


Epoch [105/5000]: Train loss: 1.0882, Valid loss: 1.0217


Epoch [106/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.79it/s, loss=1.25]


Epoch [106/5000]: Train loss: 1.0905, Valid loss: 1.0109
Saving model with loss 1.011...


Epoch [107/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.37it/s, loss=1.05]


Epoch [107/5000]: Train loss: 1.0816, Valid loss: 1.0361


Epoch [108/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.34it/s, loss=1.01]


Epoch [108/5000]: Train loss: 1.0891, Valid loss: 1.0532


Epoch [109/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.32it/s, loss=1.05]


Epoch [109/5000]: Train loss: 1.0741, Valid loss: 1.0508


Epoch [110/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.53it/s, loss=1.09]


Epoch [110/5000]: Train loss: 1.0797, Valid loss: 1.0051
Saving model with loss 1.005...


Epoch [111/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.26it/s, loss=1.19]


Epoch [111/5000]: Train loss: 1.0848, Valid loss: 1.0084


Epoch [112/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.23it/s, loss=0.972]


Epoch [112/5000]: Train loss: 1.0716, Valid loss: 1.0033
Saving model with loss 1.003...


Epoch [113/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.27it/s, loss=0.934]


Epoch [113/5000]: Train loss: 1.0761, Valid loss: 1.0362


Epoch [114/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.22it/s, loss=1.11]


Epoch [114/5000]: Train loss: 1.0761, Valid loss: 1.0588


Epoch [115/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.86it/s, loss=1.03]


Epoch [115/5000]: Train loss: 1.0734, Valid loss: 1.0067


Epoch [116/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.61it/s, loss=1.11]


Epoch [116/5000]: Train loss: 1.0792, Valid loss: 1.0032
Saving model with loss 1.003...


Epoch [117/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.71it/s, loss=1.11]


Epoch [117/5000]: Train loss: 1.0757, Valid loss: 1.0035


Epoch [118/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.79it/s, loss=1.1]


Epoch [118/5000]: Train loss: 1.0742, Valid loss: 1.0699


Epoch [119/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.22it/s, loss=0.915]


Epoch [119/5000]: Train loss: 1.0796, Valid loss: 1.0026
Saving model with loss 1.003...


Epoch [120/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.00it/s, loss=1.08]


Epoch [120/5000]: Train loss: 1.0771, Valid loss: 1.0064


Epoch [121/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.09it/s, loss=1.04]


Epoch [121/5000]: Train loss: 1.0770, Valid loss: 1.0001
Saving model with loss 1.000...


Epoch [122/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.83it/s, loss=0.841]


Epoch [122/5000]: Train loss: 1.0841, Valid loss: 1.0354


Epoch [123/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.42it/s, loss=1.09]


Epoch [123/5000]: Train loss: 1.0833, Valid loss: 0.9954
Saving model with loss 0.995...


Epoch [124/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.69it/s, loss=0.915]


Epoch [124/5000]: Train loss: 1.0646, Valid loss: 0.9990


Epoch [125/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.53it/s, loss=1.16]


Epoch [125/5000]: Train loss: 1.0721, Valid loss: 1.0064


Epoch [126/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.44it/s, loss=0.967]


Epoch [126/5000]: Train loss: 1.0674, Valid loss: 1.0374


Epoch [127/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.68it/s, loss=1.1]


Epoch [127/5000]: Train loss: 1.0800, Valid loss: 1.0033


Epoch [128/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.49it/s, loss=1.12]


Epoch [128/5000]: Train loss: 1.0908, Valid loss: 1.0511


Epoch [129/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.44it/s, loss=1.17]


Epoch [129/5000]: Train loss: 1.0819, Valid loss: 0.9992


Epoch [130/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.26it/s, loss=1.11]


Epoch [130/5000]: Train loss: 1.0765, Valid loss: 1.0516


Epoch [131/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.25it/s, loss=0.957]


Epoch [131/5000]: Train loss: 1.0777, Valid loss: 0.9963


Epoch [132/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.91it/s, loss=1.11]


Epoch [132/5000]: Train loss: 1.0701, Valid loss: 0.9982


Epoch [133/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.82it/s, loss=1.03]


Epoch [133/5000]: Train loss: 1.0802, Valid loss: 1.0022


Epoch [134/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.86it/s, loss=1.04]


Epoch [134/5000]: Train loss: 1.0689, Valid loss: 0.9912
Saving model with loss 0.991...


Epoch [135/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.60it/s, loss=1.12]


Epoch [135/5000]: Train loss: 1.0717, Valid loss: 0.9911
Saving model with loss 0.991...


Epoch [136/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.75it/s, loss=1.26]


Epoch [136/5000]: Train loss: 1.0768, Valid loss: 0.9930


Epoch [137/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.52it/s, loss=1.31]


Epoch [137/5000]: Train loss: 1.0857, Valid loss: 0.9991


Epoch [138/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.67it/s, loss=0.909]


Epoch [138/5000]: Train loss: 1.0650, Valid loss: 1.0021


Epoch [139/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.53it/s, loss=1.08]


Epoch [139/5000]: Train loss: 1.0686, Valid loss: 0.9889
Saving model with loss 0.989...


Epoch [140/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.08it/s, loss=0.976]


Epoch [140/5000]: Train loss: 1.0630, Valid loss: 1.0053


Epoch [141/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.29it/s, loss=1.01]


Epoch [141/5000]: Train loss: 1.0626, Valid loss: 0.9936


Epoch [142/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.20it/s, loss=1]


Epoch [142/5000]: Train loss: 1.0741, Valid loss: 0.9875
Saving model with loss 0.988...


Epoch [143/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.21it/s, loss=0.954]


Epoch [143/5000]: Train loss: 1.0654, Valid loss: 1.0093


Epoch [144/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.95it/s, loss=1.38]


Epoch [144/5000]: Train loss: 1.0746, Valid loss: 0.9974


Epoch [145/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.20it/s, loss=1.24]


Epoch [145/5000]: Train loss: 1.0704, Valid loss: 1.0168


Epoch [146/5000]: 100%|██████████| 14/14 [00:00<00:00, 162.87it/s, loss=1.21]


Epoch [146/5000]: Train loss: 1.0689, Valid loss: 1.0354


Epoch [147/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.16it/s, loss=1.41]


Epoch [147/5000]: Train loss: 1.0785, Valid loss: 1.0042


Epoch [148/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.01it/s, loss=0.996]


Epoch [148/5000]: Train loss: 1.0561, Valid loss: 0.9833
Saving model with loss 0.983...


Epoch [149/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.78it/s, loss=1.02]


Epoch [149/5000]: Train loss: 1.0676, Valid loss: 0.9996


Epoch [150/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.83it/s, loss=0.891]


Epoch [150/5000]: Train loss: 1.0583, Valid loss: 0.9824
Saving model with loss 0.982...


Epoch [151/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.78it/s, loss=1.27]


Epoch [151/5000]: Train loss: 1.0744, Valid loss: 0.9917


Epoch [152/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.91it/s, loss=1.05]


Epoch [152/5000]: Train loss: 1.0804, Valid loss: 1.0331


Epoch [153/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.58it/s, loss=0.919]


Epoch [153/5000]: Train loss: 1.0638, Valid loss: 0.9830


Epoch [154/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.04it/s, loss=0.981]


Epoch [154/5000]: Train loss: 1.0602, Valid loss: 0.9975


Epoch [155/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.56it/s, loss=1.11]


Epoch [155/5000]: Train loss: 1.0624, Valid loss: 0.9836


Epoch [156/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.36it/s, loss=1.08]


Epoch [156/5000]: Train loss: 1.0606, Valid loss: 1.0851


Epoch [157/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.13it/s, loss=1.1]


Epoch [157/5000]: Train loss: 1.0946, Valid loss: 0.9806
Saving model with loss 0.981...


Epoch [158/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.68it/s, loss=0.904]


Epoch [158/5000]: Train loss: 1.0595, Valid loss: 0.9813


Epoch [159/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.95it/s, loss=1.25]


Epoch [159/5000]: Train loss: 1.0756, Valid loss: 1.0620


Epoch [160/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.03it/s, loss=1.06]


Epoch [160/5000]: Train loss: 1.0810, Valid loss: 0.9799
Saving model with loss 0.980...


Epoch [161/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.05it/s, loss=1.09]


Epoch [161/5000]: Train loss: 1.0700, Valid loss: 0.9976


Epoch [162/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.27it/s, loss=0.98]


Epoch [162/5000]: Train loss: 1.0564, Valid loss: 1.0297


Epoch [163/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.14it/s, loss=1.12]


Epoch [163/5000]: Train loss: 1.0651, Valid loss: 0.9947


Epoch [164/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.12it/s, loss=1.03]


Epoch [164/5000]: Train loss: 1.0543, Valid loss: 0.9794
Saving model with loss 0.979...


Epoch [165/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.73it/s, loss=1.19]


Epoch [165/5000]: Train loss: 1.0669, Valid loss: 1.0100


Epoch [166/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.87it/s, loss=0.951]


Epoch [166/5000]: Train loss: 1.0561, Valid loss: 1.0106


Epoch [167/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.81it/s, loss=1.17]


Epoch [167/5000]: Train loss: 1.0747, Valid loss: 1.0023


Epoch [168/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.22it/s, loss=0.957]


Epoch [168/5000]: Train loss: 1.0764, Valid loss: 1.0285


Epoch [169/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.98it/s, loss=1.08]


Epoch [169/5000]: Train loss: 1.0691, Valid loss: 1.0104


Epoch [170/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.26it/s, loss=1.06]


Epoch [170/5000]: Train loss: 1.0661, Valid loss: 0.9827


Epoch [171/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.48it/s, loss=0.83]


Epoch [171/5000]: Train loss: 1.0613, Valid loss: 0.9814


Epoch [172/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.21it/s, loss=1.16]


Epoch [172/5000]: Train loss: 1.0718, Valid loss: 0.9790
Saving model with loss 0.979...


Epoch [173/5000]: 100%|██████████| 14/14 [00:00<00:00, 111.68it/s, loss=0.837]


Epoch [173/5000]: Train loss: 1.0517, Valid loss: 0.9942


Epoch [174/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.24it/s, loss=0.991]


Epoch [174/5000]: Train loss: 1.0582, Valid loss: 0.9813


Epoch [175/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.06it/s, loss=0.963]


Epoch [175/5000]: Train loss: 1.0538, Valid loss: 0.9810


Epoch [176/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.70it/s, loss=1.05]


Epoch [176/5000]: Train loss: 1.0562, Valid loss: 1.0444


Epoch [177/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.45it/s, loss=1.09]


Epoch [177/5000]: Train loss: 1.0762, Valid loss: 0.9760
Saving model with loss 0.976...


Epoch [178/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.56it/s, loss=1.08]


Epoch [178/5000]: Train loss: 1.0620, Valid loss: 0.9838


Epoch [179/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.68it/s, loss=0.937]


Epoch [179/5000]: Train loss: 1.0895, Valid loss: 1.1514


Epoch [180/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.65it/s, loss=1.19]


Epoch [180/5000]: Train loss: 1.1126, Valid loss: 0.9809


Epoch [181/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.38it/s, loss=1.11]


Epoch [181/5000]: Train loss: 1.0648, Valid loss: 0.9810


Epoch [182/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.87it/s, loss=0.962]


Epoch [182/5000]: Train loss: 1.0554, Valid loss: 0.9952


Epoch [183/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.95it/s, loss=1.13]


Epoch [183/5000]: Train loss: 1.0616, Valid loss: 0.9803


Epoch [184/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.11it/s, loss=1]


Epoch [184/5000]: Train loss: 1.0522, Valid loss: 0.9980


Epoch [185/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.21it/s, loss=1.1]


Epoch [185/5000]: Train loss: 1.0554, Valid loss: 0.9779


Epoch [186/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.33it/s, loss=1.09]


Epoch [186/5000]: Train loss: 1.0607, Valid loss: 0.9935


Epoch [187/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.10it/s, loss=0.99]


Epoch [187/5000]: Train loss: 1.0549, Valid loss: 0.9957


Epoch [188/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.04it/s, loss=1.13]


Epoch [188/5000]: Train loss: 1.0566, Valid loss: 1.0184


Epoch [189/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.45it/s, loss=1.1]


Epoch [189/5000]: Train loss: 1.0609, Valid loss: 0.9776


Epoch [190/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.67it/s, loss=0.928]


Epoch [190/5000]: Train loss: 1.0503, Valid loss: 0.9770


Epoch [191/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.14it/s, loss=1]


Epoch [191/5000]: Train loss: 1.0691, Valid loss: 1.0156


Epoch [192/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.06it/s, loss=1.1]


Epoch [192/5000]: Train loss: 1.0725, Valid loss: 0.9873


Epoch [193/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.36it/s, loss=1.08]


Epoch [193/5000]: Train loss: 1.0546, Valid loss: 0.9729
Saving model with loss 0.973...


Epoch [194/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.56it/s, loss=0.949]


Epoch [194/5000]: Train loss: 1.0501, Valid loss: 0.9827


Epoch [195/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.89it/s, loss=1.17]


Epoch [195/5000]: Train loss: 1.0616, Valid loss: 0.9697
Saving model with loss 0.970...


Epoch [196/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.23it/s, loss=0.968]


Epoch [196/5000]: Train loss: 1.0755, Valid loss: 0.9860


Epoch [197/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.16it/s, loss=0.909]


Epoch [197/5000]: Train loss: 1.0463, Valid loss: 0.9867


Epoch [198/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.09it/s, loss=1.12]


Epoch [198/5000]: Train loss: 1.0647, Valid loss: 0.9907


Epoch [199/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.57it/s, loss=1.08]


Epoch [199/5000]: Train loss: 1.0558, Valid loss: 0.9726


Epoch [200/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.93it/s, loss=0.935]


Epoch [200/5000]: Train loss: 1.0483, Valid loss: 0.9787


Epoch [201/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.76it/s, loss=0.923]


Epoch [201/5000]: Train loss: 1.0484, Valid loss: 0.9697


Epoch [202/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.15it/s, loss=0.984]


Epoch [202/5000]: Train loss: 1.0525, Valid loss: 0.9702


Epoch [203/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.79it/s, loss=1.21]


Epoch [203/5000]: Train loss: 1.0700, Valid loss: 0.9862


Epoch [204/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.70it/s, loss=0.901]


Epoch [204/5000]: Train loss: 1.0558, Valid loss: 1.0014


Epoch [205/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.92it/s, loss=1.2]


Epoch [205/5000]: Train loss: 1.0647, Valid loss: 0.9942


Epoch [206/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.52it/s, loss=0.784]


Epoch [206/5000]: Train loss: 1.0390, Valid loss: 0.9690
Saving model with loss 0.969...


Epoch [207/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.03it/s, loss=1.11]


Epoch [207/5000]: Train loss: 1.0554, Valid loss: 0.9813


Epoch [208/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.26it/s, loss=0.883]


Epoch [208/5000]: Train loss: 1.0613, Valid loss: 0.9725


Epoch [209/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.39it/s, loss=1.09]


Epoch [209/5000]: Train loss: 1.0741, Valid loss: 0.9718


Epoch [210/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.22it/s, loss=1.03]


Epoch [210/5000]: Train loss: 1.0568, Valid loss: 0.9965


Epoch [211/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.46it/s, loss=0.785]


Epoch [211/5000]: Train loss: 1.0400, Valid loss: 1.0158


Epoch [212/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.17it/s, loss=1.07]


Epoch [212/5000]: Train loss: 1.0629, Valid loss: 0.9644
Saving model with loss 0.964...


Epoch [213/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.92it/s, loss=1.05]


Epoch [213/5000]: Train loss: 1.0575, Valid loss: 0.9793


Epoch [214/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.50it/s, loss=0.986]


Epoch [214/5000]: Train loss: 1.0565, Valid loss: 0.9645


Epoch [215/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.73it/s, loss=1.03]


Epoch [215/5000]: Train loss: 1.0680, Valid loss: 1.0261


Epoch [216/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.54it/s, loss=0.918]


Epoch [216/5000]: Train loss: 1.0541, Valid loss: 0.9739


Epoch [217/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.00it/s, loss=1.19]


Epoch [217/5000]: Train loss: 1.0735, Valid loss: 0.9695


Epoch [218/5000]: 100%|██████████| 14/14 [00:00<00:00, 134.70it/s, loss=1.15]


Epoch [218/5000]: Train loss: 1.0736, Valid loss: 1.0653


Epoch [219/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.42it/s, loss=0.926]


Epoch [219/5000]: Train loss: 1.0631, Valid loss: 0.9663


Epoch [220/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.54it/s, loss=0.835]


Epoch [220/5000]: Train loss: 1.0466, Valid loss: 0.9696


Epoch [221/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.53it/s, loss=0.953]


Epoch [221/5000]: Train loss: 1.0472, Valid loss: 0.9927


Epoch [222/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.30it/s, loss=1.04]


Epoch [222/5000]: Train loss: 1.0544, Valid loss: 0.9880


Epoch [223/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.87it/s, loss=0.958]


Epoch [223/5000]: Train loss: 1.0500, Valid loss: 1.0141


Epoch [224/5000]: 100%|██████████| 14/14 [00:00<00:00, 156.47it/s, loss=0.939]


Epoch [224/5000]: Train loss: 1.0584, Valid loss: 0.9780


Epoch [225/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.98it/s, loss=1.01]


Epoch [225/5000]: Train loss: 1.0581, Valid loss: 0.9769


Epoch [226/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.94it/s, loss=0.867]


Epoch [226/5000]: Train loss: 1.0479, Valid loss: 0.9673


Epoch [227/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.06it/s, loss=1.06]


Epoch [227/5000]: Train loss: 1.0582, Valid loss: 0.9852


Epoch [228/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.62it/s, loss=0.97]


Epoch [228/5000]: Train loss: 1.0550, Valid loss: 0.9749


Epoch [229/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.69it/s, loss=0.977]


Epoch [229/5000]: Train loss: 1.0598, Valid loss: 0.9620
Saving model with loss 0.962...


Epoch [230/5000]: 100%|██████████| 14/14 [00:00<00:00, 131.93it/s, loss=1.04]


Epoch [230/5000]: Train loss: 1.0539, Valid loss: 1.0084


Epoch [231/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.80it/s, loss=1.13]


Epoch [231/5000]: Train loss: 1.0656, Valid loss: 0.9607
Saving model with loss 0.961...


Epoch [232/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.25it/s, loss=1.13]


Epoch [232/5000]: Train loss: 1.0549, Valid loss: 1.0044


Epoch [233/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.15it/s, loss=1.13]


Epoch [233/5000]: Train loss: 1.0568, Valid loss: 0.9802


Epoch [234/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.14it/s, loss=0.867]


Epoch [234/5000]: Train loss: 1.0440, Valid loss: 0.9583
Saving model with loss 0.958...


Epoch [235/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.18it/s, loss=1.1]


Epoch [235/5000]: Train loss: 1.0626, Valid loss: 1.0234


Epoch [236/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.53it/s, loss=0.785]


Epoch [236/5000]: Train loss: 1.0475, Valid loss: 0.9621


Epoch [237/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.24it/s, loss=0.916]


Epoch [237/5000]: Train loss: 1.0517, Valid loss: 1.0157


Epoch [238/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.62it/s, loss=1.34]


Epoch [238/5000]: Train loss: 1.0699, Valid loss: 0.9708


Epoch [239/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.76it/s, loss=1.05]


Epoch [239/5000]: Train loss: 1.0530, Valid loss: 0.9663


Epoch [240/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.16it/s, loss=1.03]


Epoch [240/5000]: Train loss: 1.0532, Valid loss: 1.0177


Epoch [241/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.05it/s, loss=1.01]


Epoch [241/5000]: Train loss: 1.0521, Valid loss: 0.9713


Epoch [242/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.01it/s, loss=0.932]


Epoch [242/5000]: Train loss: 1.0551, Valid loss: 0.9811


Epoch [243/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.70it/s, loss=1.17]


Epoch [243/5000]: Train loss: 1.0668, Valid loss: 0.9579
Saving model with loss 0.958...


Epoch [244/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.89it/s, loss=1.23]


Epoch [244/5000]: Train loss: 1.0597, Valid loss: 0.9906


Epoch [245/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.49it/s, loss=1.03]


Epoch [245/5000]: Train loss: 1.0482, Valid loss: 1.0023


Epoch [246/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.05it/s, loss=1.11]


Epoch [246/5000]: Train loss: 1.0641, Valid loss: 0.9680


Epoch [247/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.57it/s, loss=1.19]


Epoch [247/5000]: Train loss: 1.0551, Valid loss: 1.0063


Epoch [248/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.74it/s, loss=0.998]


Epoch [248/5000]: Train loss: 1.0572, Valid loss: 0.9549
Saving model with loss 0.955...


Epoch [249/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.70it/s, loss=1.15]


Epoch [249/5000]: Train loss: 1.0601, Valid loss: 0.9585


Epoch [250/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.87it/s, loss=0.951]


Epoch [250/5000]: Train loss: 1.0497, Valid loss: 1.0248


Epoch [251/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.33it/s, loss=0.967]


Epoch [251/5000]: Train loss: 1.0636, Valid loss: 0.9613


Epoch [252/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.76it/s, loss=1.31]


Epoch [252/5000]: Train loss: 1.0728, Valid loss: 0.9945


Epoch [253/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.46it/s, loss=1.02]


Epoch [253/5000]: Train loss: 1.0610, Valid loss: 0.9602


Epoch [254/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.04it/s, loss=1.05]


Epoch [254/5000]: Train loss: 1.0496, Valid loss: 1.0057


Epoch [255/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.59it/s, loss=0.965]


Epoch [255/5000]: Train loss: 1.0618, Valid loss: 0.9747


Epoch [256/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.10it/s, loss=0.917]


Epoch [256/5000]: Train loss: 1.0555, Valid loss: 0.9617


Epoch [257/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.18it/s, loss=1.06]


Epoch [257/5000]: Train loss: 1.0557, Valid loss: 1.0384


Epoch [258/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.26it/s, loss=1.08]


Epoch [258/5000]: Train loss: 1.0788, Valid loss: 0.9727


Epoch [259/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.43it/s, loss=1.2]


Epoch [259/5000]: Train loss: 1.0729, Valid loss: 0.9590


Epoch [260/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.39it/s, loss=0.943]


Epoch [260/5000]: Train loss: 1.0557, Valid loss: 1.0346


Epoch [261/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.76it/s, loss=0.923]


Epoch [261/5000]: Train loss: 1.0538, Valid loss: 0.9944


Epoch [262/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.37it/s, loss=0.966]


Epoch [262/5000]: Train loss: 1.0504, Valid loss: 0.9633


Epoch [263/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.35it/s, loss=0.912]


Epoch [263/5000]: Train loss: 1.0467, Valid loss: 0.9568


Epoch [264/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.61it/s, loss=1.07]


Epoch [264/5000]: Train loss: 1.0509, Valid loss: 0.9758


Epoch [265/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.88it/s, loss=0.842]


Epoch [265/5000]: Train loss: 1.0433, Valid loss: 0.9535
Saving model with loss 0.953...


Epoch [266/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.11it/s, loss=0.986]


Epoch [266/5000]: Train loss: 1.0527, Valid loss: 0.9879


Epoch [267/5000]: 100%|██████████| 14/14 [00:00<00:00, 123.73it/s, loss=1.03]


Epoch [267/5000]: Train loss: 1.0482, Valid loss: 0.9647


Epoch [268/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.94it/s, loss=1.19]


Epoch [268/5000]: Train loss: 1.0576, Valid loss: 0.9528
Saving model with loss 0.953...


Epoch [269/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.50it/s, loss=1.05]


Epoch [269/5000]: Train loss: 1.0528, Valid loss: 0.9596


Epoch [270/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.07it/s, loss=0.818]


Epoch [270/5000]: Train loss: 1.0426, Valid loss: 0.9693


Epoch [271/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.14it/s, loss=0.973]


Epoch [271/5000]: Train loss: 1.0449, Valid loss: 0.9737


Epoch [272/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.35it/s, loss=0.996]


Epoch [272/5000]: Train loss: 1.0489, Valid loss: 0.9667


Epoch [273/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.05it/s, loss=1.04]


Epoch [273/5000]: Train loss: 1.0485, Valid loss: 0.9598


Epoch [274/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.37it/s, loss=1.03]


Epoch [274/5000]: Train loss: 1.0461, Valid loss: 0.9543


Epoch [275/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.58it/s, loss=1.04]


Epoch [275/5000]: Train loss: 1.0503, Valid loss: 0.9573


Epoch [276/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.26it/s, loss=1.24]


Epoch [276/5000]: Train loss: 1.0623, Valid loss: 1.0086


Epoch [277/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.33it/s, loss=0.87]


Epoch [277/5000]: Train loss: 1.0433, Valid loss: 0.9570


Epoch [278/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.93it/s, loss=1.07]


Epoch [278/5000]: Train loss: 1.0531, Valid loss: 0.9576


Epoch [279/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.45it/s, loss=1.39]


Epoch [279/5000]: Train loss: 1.0684, Valid loss: 1.0075


Epoch [280/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.17it/s, loss=0.918]


Epoch [280/5000]: Train loss: 1.0499, Valid loss: 0.9523
Saving model with loss 0.952...


Epoch [281/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.33it/s, loss=1.16]


Epoch [281/5000]: Train loss: 1.0582, Valid loss: 0.9534


Epoch [282/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.95it/s, loss=1.02]


Epoch [282/5000]: Train loss: 1.0555, Valid loss: 0.9749


Epoch [283/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.45it/s, loss=1.24]


Epoch [283/5000]: Train loss: 1.0664, Valid loss: 0.9553


Epoch [284/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.09it/s, loss=0.97]


Epoch [284/5000]: Train loss: 1.0532, Valid loss: 0.9585


Epoch [285/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.11it/s, loss=1.16]


Epoch [285/5000]: Train loss: 1.0541, Valid loss: 0.9693


Epoch [286/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.81it/s, loss=0.946]


Epoch [286/5000]: Train loss: 1.0458, Valid loss: 0.9959


Epoch [287/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.71it/s, loss=0.864]


Epoch [287/5000]: Train loss: 1.0429, Valid loss: 0.9580


Epoch [288/5000]: 100%|██████████| 14/14 [00:00<00:00, 140.40it/s, loss=0.999]


Epoch [288/5000]: Train loss: 1.0546, Valid loss: 0.9554


Epoch [289/5000]: 100%|██████████| 14/14 [00:00<00:00, 139.68it/s, loss=1.11]


Epoch [289/5000]: Train loss: 1.0517, Valid loss: 0.9577


Epoch [290/5000]: 100%|██████████| 14/14 [00:00<00:00, 144.38it/s, loss=1.14]


Epoch [290/5000]: Train loss: 1.0482, Valid loss: 0.9644


Epoch [291/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.40it/s, loss=1.04]


Epoch [291/5000]: Train loss: 1.0457, Valid loss: 0.9529


Epoch [292/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.37it/s, loss=1.01]


Epoch [292/5000]: Train loss: 1.0503, Valid loss: 0.9505
Saving model with loss 0.951...


Epoch [293/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.86it/s, loss=1.28]


Epoch [293/5000]: Train loss: 1.0713, Valid loss: 1.0552


Epoch [294/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.77it/s, loss=1.06]


Epoch [294/5000]: Train loss: 1.0899, Valid loss: 0.9856


Epoch [295/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.62it/s, loss=1.06]


Epoch [295/5000]: Train loss: 1.0913, Valid loss: 0.9612


Epoch [296/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.35it/s, loss=1.06]


Epoch [296/5000]: Train loss: 1.0666, Valid loss: 0.9916


Epoch [297/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.95it/s, loss=0.992]


Epoch [297/5000]: Train loss: 1.0471, Valid loss: 0.9559


Epoch [298/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.46it/s, loss=0.972]


Epoch [298/5000]: Train loss: 1.0476, Valid loss: 0.9544


Epoch [299/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.41it/s, loss=1]


Epoch [299/5000]: Train loss: 1.0562, Valid loss: 0.9520


Epoch [300/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.52it/s, loss=1.18]


Epoch [300/5000]: Train loss: 1.0639, Valid loss: 0.9504
Saving model with loss 0.950...


Epoch [301/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.51it/s, loss=1.14]


Epoch [301/5000]: Train loss: 1.0533, Valid loss: 0.9472
Saving model with loss 0.947...


Epoch [302/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.19it/s, loss=0.986]


Epoch [302/5000]: Train loss: 1.0452, Valid loss: 0.9547


Epoch [303/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.37it/s, loss=1.2]


Epoch [303/5000]: Train loss: 1.0596, Valid loss: 0.9557


Epoch [304/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.48it/s, loss=0.901]


Epoch [304/5000]: Train loss: 1.0491, Valid loss: 0.9668


Epoch [305/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.72it/s, loss=1.01]


Epoch [305/5000]: Train loss: 1.0464, Valid loss: 0.9446
Saving model with loss 0.945...


Epoch [306/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.86it/s, loss=1.09]


Epoch [306/5000]: Train loss: 1.0600, Valid loss: 0.9829


Epoch [307/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.26it/s, loss=1.03]


Epoch [307/5000]: Train loss: 1.0475, Valid loss: 0.9831


Epoch [308/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.11it/s, loss=1.19]


Epoch [308/5000]: Train loss: 1.0582, Valid loss: 0.9539


Epoch [309/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.88it/s, loss=0.864]


Epoch [309/5000]: Train loss: 1.0443, Valid loss: 0.9512


Epoch [310/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.03it/s, loss=1.12]


Epoch [310/5000]: Train loss: 1.0501, Valid loss: 0.9748


Epoch [311/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.86it/s, loss=0.911]


Epoch [311/5000]: Train loss: 1.0426, Valid loss: 0.9463


Epoch [312/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.41it/s, loss=1.05]


Epoch [312/5000]: Train loss: 1.0471, Valid loss: 0.9461


Epoch [313/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.74it/s, loss=0.902]


Epoch [313/5000]: Train loss: 1.0412, Valid loss: 0.9488


Epoch [314/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.63it/s, loss=1.02]


Epoch [314/5000]: Train loss: 1.0489, Valid loss: 0.9678


Epoch [315/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.13it/s, loss=0.941]


Epoch [315/5000]: Train loss: 1.0404, Valid loss: 0.9446


Epoch [316/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.44it/s, loss=1.07]


Epoch [316/5000]: Train loss: 1.0469, Valid loss: 0.9443
Saving model with loss 0.944...


Epoch [317/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.89it/s, loss=0.946]


Epoch [317/5000]: Train loss: 1.0460, Valid loss: 0.9437
Saving model with loss 0.944...


Epoch [318/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.73it/s, loss=0.983]


Epoch [318/5000]: Train loss: 1.0486, Valid loss: 0.9801


Epoch [319/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.28it/s, loss=1.13]


Epoch [319/5000]: Train loss: 1.0635, Valid loss: 0.9525


Epoch [320/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.63it/s, loss=1.03]


Epoch [320/5000]: Train loss: 1.0626, Valid loss: 0.9443


Epoch [321/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.48it/s, loss=1.05]


Epoch [321/5000]: Train loss: 1.0468, Valid loss: 0.9531


Epoch [322/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.30it/s, loss=1.02]


Epoch [322/5000]: Train loss: 1.0454, Valid loss: 0.9507


Epoch [323/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.31it/s, loss=0.951]


Epoch [323/5000]: Train loss: 1.0541, Valid loss: 0.9573


Epoch [324/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.37it/s, loss=1.08]


Epoch [324/5000]: Train loss: 1.0616, Valid loss: 0.9444


Epoch [325/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.34it/s, loss=0.825]


Epoch [325/5000]: Train loss: 1.0319, Valid loss: 0.9506


Epoch [326/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.32it/s, loss=0.92]


Epoch [326/5000]: Train loss: 1.0420, Valid loss: 0.9424
Saving model with loss 0.942...


Epoch [327/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.20it/s, loss=1.09]


Epoch [327/5000]: Train loss: 1.0463, Valid loss: 0.9544


Epoch [328/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.75it/s, loss=1.28]


Epoch [328/5000]: Train loss: 1.0692, Valid loss: 0.9602


Epoch [329/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.91it/s, loss=0.943]


Epoch [329/5000]: Train loss: 1.0491, Valid loss: 0.9422
Saving model with loss 0.942...


Epoch [330/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.06it/s, loss=1.1]


Epoch [330/5000]: Train loss: 1.0497, Valid loss: 0.9401
Saving model with loss 0.940...


Epoch [331/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.63it/s, loss=1.34]


Epoch [331/5000]: Train loss: 1.0637, Valid loss: 0.9707


Epoch [332/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.16it/s, loss=0.813]


Epoch [332/5000]: Train loss: 1.0387, Valid loss: 1.0246


Epoch [333/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.13it/s, loss=0.958]


Epoch [333/5000]: Train loss: 1.0448, Valid loss: 0.9575


Epoch [334/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.52it/s, loss=0.895]


Epoch [334/5000]: Train loss: 1.0370, Valid loss: 0.9403


Epoch [335/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.62it/s, loss=0.817]


Epoch [335/5000]: Train loss: 1.0379, Valid loss: 0.9615


Epoch [336/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.61it/s, loss=1.12]


Epoch [336/5000]: Train loss: 1.0527, Valid loss: 0.9473


Epoch [337/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.78it/s, loss=1.14]


Epoch [337/5000]: Train loss: 1.0583, Valid loss: 0.9800


Epoch [338/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.35it/s, loss=1.2]


Epoch [338/5000]: Train loss: 1.0693, Valid loss: 0.9444


Epoch [339/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.24it/s, loss=1.05]


Epoch [339/5000]: Train loss: 1.0449, Valid loss: 0.9401


Epoch [340/5000]: 100%|██████████| 14/14 [00:00<00:00, 216.04it/s, loss=1.07]


Epoch [340/5000]: Train loss: 1.0450, Valid loss: 0.9530


Epoch [341/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.97it/s, loss=1.06]


Epoch [341/5000]: Train loss: 1.0558, Valid loss: 0.9441


Epoch [342/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.15it/s, loss=1.14]


Epoch [342/5000]: Train loss: 1.0681, Valid loss: 0.9813


Epoch [343/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.20it/s, loss=0.946]


Epoch [343/5000]: Train loss: 1.0468, Valid loss: 0.9369
Saving model with loss 0.937...


Epoch [344/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.82it/s, loss=0.962]


Epoch [344/5000]: Train loss: 1.0476, Valid loss: 0.9615


Epoch [345/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.22it/s, loss=1.11]


Epoch [345/5000]: Train loss: 1.0522, Valid loss: 1.0043


Epoch [346/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.06it/s, loss=1.11]


Epoch [346/5000]: Train loss: 1.0569, Valid loss: 0.9380


Epoch [347/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.70it/s, loss=1]


Epoch [347/5000]: Train loss: 1.0538, Valid loss: 0.9625


Epoch [348/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.74it/s, loss=0.983]


Epoch [348/5000]: Train loss: 1.0466, Valid loss: 0.9635


Epoch [349/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.79it/s, loss=1.09]


Epoch [349/5000]: Train loss: 1.0476, Valid loss: 0.9489


Epoch [350/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.36it/s, loss=1.27]


Epoch [350/5000]: Train loss: 1.0536, Valid loss: 0.9747


Epoch [351/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.97it/s, loss=0.922]


Epoch [351/5000]: Train loss: 1.0467, Valid loss: 0.9416


Epoch [352/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.92it/s, loss=1.03]


Epoch [352/5000]: Train loss: 1.0541, Valid loss: 0.9363
Saving model with loss 0.936...


Epoch [353/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.86it/s, loss=1.26]


Epoch [353/5000]: Train loss: 1.0566, Valid loss: 0.9534


Epoch [354/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.92it/s, loss=0.948]


Epoch [354/5000]: Train loss: 1.0458, Valid loss: 0.9590


Epoch [355/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.10it/s, loss=1.05]


Epoch [355/5000]: Train loss: 1.0441, Valid loss: 0.9448


Epoch [356/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.27it/s, loss=0.905]


Epoch [356/5000]: Train loss: 1.0400, Valid loss: 0.9407


Epoch [357/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.57it/s, loss=1.14]


Epoch [357/5000]: Train loss: 1.0523, Valid loss: 0.9561


Epoch [358/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.54it/s, loss=1.22]


Epoch [358/5000]: Train loss: 1.0590, Valid loss: 0.9844


Epoch [359/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.79it/s, loss=1.05]


Epoch [359/5000]: Train loss: 1.0637, Valid loss: 0.9405


Epoch [360/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.28it/s, loss=0.915]


Epoch [360/5000]: Train loss: 1.0492, Valid loss: 0.9430


Epoch [361/5000]: 100%|██████████| 14/14 [00:00<00:00, 169.27it/s, loss=0.935]


Epoch [361/5000]: Train loss: 1.0416, Valid loss: 0.9373


Epoch [362/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.06it/s, loss=0.878]


Epoch [362/5000]: Train loss: 1.0510, Valid loss: 1.0177


Epoch [363/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.65it/s, loss=1.11]


Epoch [363/5000]: Train loss: 1.0881, Valid loss: 0.9460


Epoch [364/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.83it/s, loss=1.19]


Epoch [364/5000]: Train loss: 1.0626, Valid loss: 0.9411


Epoch [365/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.06it/s, loss=1.16]


Epoch [365/5000]: Train loss: 1.0492, Valid loss: 0.9661


Epoch [366/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.44it/s, loss=1.12]


Epoch [366/5000]: Train loss: 1.0522, Valid loss: 0.9835


Epoch [367/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.24it/s, loss=0.984]


Epoch [367/5000]: Train loss: 1.0528, Valid loss: 0.9438


Epoch [368/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.97it/s, loss=1.17]


Epoch [368/5000]: Train loss: 1.0535, Valid loss: 0.9457


Epoch [369/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.55it/s, loss=0.899]


Epoch [369/5000]: Train loss: 1.0441, Valid loss: 0.9486


Epoch [370/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.47it/s, loss=0.942]


Epoch [370/5000]: Train loss: 1.0389, Valid loss: 0.9339
Saving model with loss 0.934...


Epoch [371/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.19it/s, loss=1.12]


Epoch [371/5000]: Train loss: 1.0487, Valid loss: 0.9333
Saving model with loss 0.933...


Epoch [372/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.27it/s, loss=0.999]


Epoch [372/5000]: Train loss: 1.0481, Valid loss: 0.9629


Epoch [373/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.94it/s, loss=0.796]


Epoch [373/5000]: Train loss: 1.0340, Valid loss: 0.9400


Epoch [374/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.26it/s, loss=1.07]


Epoch [374/5000]: Train loss: 1.0629, Valid loss: 1.0033


Epoch [375/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.64it/s, loss=0.979]


Epoch [375/5000]: Train loss: 1.0445, Valid loss: 0.9439


Epoch [376/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.05it/s, loss=0.935]


Epoch [376/5000]: Train loss: 1.0478, Valid loss: 0.9475


Epoch [377/5000]: 100%|██████████| 14/14 [00:00<00:00, 218.19it/s, loss=1.07]


Epoch [377/5000]: Train loss: 1.0543, Valid loss: 0.9445


Epoch [378/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.39it/s, loss=1.09]


Epoch [378/5000]: Train loss: 1.0500, Valid loss: 0.9493


Epoch [379/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.56it/s, loss=0.951]


Epoch [379/5000]: Train loss: 1.0420, Valid loss: 0.9414


Epoch [380/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.20it/s, loss=0.974]


Epoch [380/5000]: Train loss: 1.0465, Valid loss: 0.9633


Epoch [381/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.99it/s, loss=1.21]


Epoch [381/5000]: Train loss: 1.0640, Valid loss: 0.9480


Epoch [382/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.59it/s, loss=0.9]


Epoch [382/5000]: Train loss: 1.0481, Valid loss: 0.9461


Epoch [383/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.69it/s, loss=0.996]


Epoch [383/5000]: Train loss: 1.0657, Valid loss: 0.9701


Epoch [384/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.32it/s, loss=1.14]


Epoch [384/5000]: Train loss: 1.0588, Valid loss: 0.9401


Epoch [385/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.99it/s, loss=1.19]


Epoch [385/5000]: Train loss: 1.0597, Valid loss: 0.9375


Epoch [386/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.59it/s, loss=1.04]


Epoch [386/5000]: Train loss: 1.0448, Valid loss: 0.9562


Epoch [387/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.71it/s, loss=1.08]


Epoch [387/5000]: Train loss: 1.0407, Valid loss: 0.9511


Epoch [388/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.57it/s, loss=1.12]


Epoch [388/5000]: Train loss: 1.0453, Valid loss: 0.9481


Epoch [389/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.18it/s, loss=1.06]


Epoch [389/5000]: Train loss: 1.0477, Valid loss: 0.9488


Epoch [390/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.37it/s, loss=0.947]


Epoch [390/5000]: Train loss: 1.0403, Valid loss: 0.9369


Epoch [391/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.79it/s, loss=1.15]


Epoch [391/5000]: Train loss: 1.0529, Valid loss: 0.9451


Epoch [392/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.95it/s, loss=0.914]


Epoch [392/5000]: Train loss: 1.0473, Valid loss: 0.9694


Epoch [393/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.53it/s, loss=1.1]


Epoch [393/5000]: Train loss: 1.0582, Valid loss: 0.9430


Epoch [394/5000]: 100%|██████████| 14/14 [00:00<00:00, 153.49it/s, loss=0.966]


Epoch [394/5000]: Train loss: 1.0480, Valid loss: 0.9463


Epoch [395/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.47it/s, loss=0.893]


Epoch [395/5000]: Train loss: 1.0396, Valid loss: 0.9326
Saving model with loss 0.933...


Epoch [396/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.70it/s, loss=1.05]


Epoch [396/5000]: Train loss: 1.0498, Valid loss: 0.9470


Epoch [397/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.61it/s, loss=0.942]


Epoch [397/5000]: Train loss: 1.0486, Valid loss: 0.9507


Epoch [398/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.63it/s, loss=1.15]


Epoch [398/5000]: Train loss: 1.0525, Valid loss: 0.9847


Epoch [399/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.81it/s, loss=1.25]


Epoch [399/5000]: Train loss: 1.0605, Valid loss: 0.9396


Epoch [400/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.78it/s, loss=1.09]


Epoch [400/5000]: Train loss: 1.0504, Valid loss: 0.9623


Epoch [401/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.78it/s, loss=1.22]


Epoch [401/5000]: Train loss: 1.0597, Valid loss: 0.9327


Epoch [402/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.96it/s, loss=1.3]


Epoch [402/5000]: Train loss: 1.0661, Valid loss: 1.0102


Epoch [403/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.06it/s, loss=0.955]


Epoch [403/5000]: Train loss: 1.0454, Valid loss: 0.9333


Epoch [404/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.61it/s, loss=1.09]


Epoch [404/5000]: Train loss: 1.0491, Valid loss: 0.9330


Epoch [405/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.17it/s, loss=1.2]


Epoch [405/5000]: Train loss: 1.0529, Valid loss: 0.9441


Epoch [406/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.85it/s, loss=0.899]


Epoch [406/5000]: Train loss: 1.0495, Valid loss: 0.9559


Epoch [407/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.65it/s, loss=1.17]


Epoch [407/5000]: Train loss: 1.0525, Valid loss: 0.9357


Epoch [408/5000]: 100%|██████████| 14/14 [00:00<00:00, 160.46it/s, loss=0.952]


Epoch [408/5000]: Train loss: 1.0377, Valid loss: 0.9439


Epoch [409/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.38it/s, loss=1.08]


Epoch [409/5000]: Train loss: 1.0445, Valid loss: 0.9519


Epoch [410/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.88it/s, loss=1.07]


Epoch [410/5000]: Train loss: 1.0525, Valid loss: 0.9412


Epoch [411/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.68it/s, loss=1.04]


Epoch [411/5000]: Train loss: 1.0485, Valid loss: 0.9433


Epoch [412/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.53it/s, loss=1.01]


Epoch [412/5000]: Train loss: 1.0396, Valid loss: 0.9374


Epoch [413/5000]: 100%|██████████| 14/14 [00:00<00:00, 144.77it/s, loss=1.31]


Epoch [413/5000]: Train loss: 1.0581, Valid loss: 0.9401


Epoch [414/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.27it/s, loss=0.972]


Epoch [414/5000]: Train loss: 1.0410, Valid loss: 0.9711


Epoch [415/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.10it/s, loss=0.853]


Epoch [415/5000]: Train loss: 1.0407, Valid loss: 0.9759


Epoch [416/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.48it/s, loss=1.02]


Epoch [416/5000]: Train loss: 1.0467, Valid loss: 0.9339


Epoch [417/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.30it/s, loss=1.24]


Epoch [417/5000]: Train loss: 1.0525, Valid loss: 0.9462


Epoch [418/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.79it/s, loss=0.946]


Epoch [418/5000]: Train loss: 1.0413, Valid loss: 0.9510


Epoch [419/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.64it/s, loss=1.1]


Epoch [419/5000]: Train loss: 1.0491, Valid loss: 0.9409


Epoch [420/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.40it/s, loss=1.06]


Epoch [420/5000]: Train loss: 1.0520, Valid loss: 0.9419


Epoch [421/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.35it/s, loss=0.879]


Epoch [421/5000]: Train loss: 1.0335, Valid loss: 0.9392


Epoch [422/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.61it/s, loss=0.885]


Epoch [422/5000]: Train loss: 1.0395, Valid loss: 0.9461


Epoch [423/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.16it/s, loss=0.902]


Epoch [423/5000]: Train loss: 1.0418, Valid loss: 0.9899


Epoch [424/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.06it/s, loss=0.811]


Epoch [424/5000]: Train loss: 1.0313, Valid loss: 0.9456


Epoch [425/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.09it/s, loss=1.09]


Epoch [425/5000]: Train loss: 1.0493, Valid loss: 0.9738


Epoch [426/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.72it/s, loss=1.05]


Epoch [426/5000]: Train loss: 1.0428, Valid loss: 0.9463


Epoch [427/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.95it/s, loss=1.09]


Epoch [427/5000]: Train loss: 1.0452, Valid loss: 0.9496


Epoch [428/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.37it/s, loss=1.01]


Epoch [428/5000]: Train loss: 1.0437, Valid loss: 1.0215


Epoch [429/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.63it/s, loss=0.91]


Epoch [429/5000]: Train loss: 1.0487, Valid loss: 0.9377


Epoch [430/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.76it/s, loss=1.04]


Epoch [430/5000]: Train loss: 1.0451, Valid loss: 0.9447


Epoch [431/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.18it/s, loss=0.964]


Epoch [431/5000]: Train loss: 1.0410, Valid loss: 0.9684


Epoch [432/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.19it/s, loss=0.939]


Epoch [432/5000]: Train loss: 1.0364, Valid loss: 0.9415


Epoch [433/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.34it/s, loss=1.06]


Epoch [433/5000]: Train loss: 1.0473, Valid loss: 0.9637


Epoch [434/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.23it/s, loss=1.05]


Epoch [434/5000]: Train loss: 1.0429, Valid loss: 0.9657


Epoch [435/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.35it/s, loss=1.16]


Epoch [435/5000]: Train loss: 1.0565, Valid loss: 0.9409


Epoch [436/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.67it/s, loss=1.15]


Epoch [436/5000]: Train loss: 1.0730, Valid loss: 0.9471


Epoch [437/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.37it/s, loss=0.865]


Epoch [437/5000]: Train loss: 1.0532, Valid loss: 1.0185


Epoch [438/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.74it/s, loss=1.08]


Epoch [438/5000]: Train loss: 1.0554, Valid loss: 0.9477


Epoch [439/5000]: 100%|██████████| 14/14 [00:00<00:00, 145.33it/s, loss=1.09]


Epoch [439/5000]: Train loss: 1.0602, Valid loss: 0.9745


Epoch [440/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.13it/s, loss=1.07]


Epoch [440/5000]: Train loss: 1.0525, Valid loss: 0.9426


Epoch [441/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.67it/s, loss=1.09]


Epoch [441/5000]: Train loss: 1.0538, Valid loss: 1.0004


Epoch [442/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.42it/s, loss=1.04]


Epoch [442/5000]: Train loss: 1.0591, Valid loss: 0.9413


Epoch [443/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.50it/s, loss=1.06]


Epoch [443/5000]: Train loss: 1.0526, Valid loss: 0.9552


Epoch [444/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.38it/s, loss=1.09]


Epoch [444/5000]: Train loss: 1.0441, Valid loss: 0.9396


Epoch [445/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.27it/s, loss=0.985]


Epoch [445/5000]: Train loss: 1.0538, Valid loss: 0.9748


Epoch [446/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.01it/s, loss=1.25]


Epoch [446/5000]: Train loss: 1.0622, Valid loss: 0.9375


Epoch [447/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.92it/s, loss=0.862]


Epoch [447/5000]: Train loss: 1.0385, Valid loss: 0.9414


Epoch [448/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.33it/s, loss=1.17]


Epoch [448/5000]: Train loss: 1.0539, Valid loss: 0.9571


Epoch [449/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.05it/s, loss=0.932]


Epoch [449/5000]: Train loss: 1.0418, Valid loss: 0.9418


Epoch [450/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.08it/s, loss=1.19]


Epoch [450/5000]: Train loss: 1.0497, Valid loss: 0.9398


Epoch [451/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.50it/s, loss=1.18]


Epoch [451/5000]: Train loss: 1.0550, Valid loss: 0.9902


Epoch [452/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.19it/s, loss=1.09]


Epoch [452/5000]: Train loss: 1.0468, Valid loss: 0.9441


Epoch [453/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.22it/s, loss=1.3]


Epoch [453/5000]: Train loss: 1.0529, Valid loss: 0.9406


Epoch [454/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.60it/s, loss=1.06]


Epoch [454/5000]: Train loss: 1.0426, Valid loss: 0.9444


Epoch [455/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.97it/s, loss=1.09]


Epoch [455/5000]: Train loss: 1.0512, Valid loss: 0.9791


Epoch [456/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.44it/s, loss=1.32]


Epoch [456/5000]: Train loss: 1.0548, Valid loss: 0.9654


Epoch [457/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.90it/s, loss=1.21]


Epoch [457/5000]: Train loss: 1.0593, Valid loss: 0.9503


Epoch [458/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.13it/s, loss=1.02]


Epoch [458/5000]: Train loss: 1.0460, Valid loss: 0.9948


Epoch [459/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.77it/s, loss=1.15]


Epoch [459/5000]: Train loss: 1.0675, Valid loss: 0.9501


Epoch [460/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.71it/s, loss=1.16]


Epoch [460/5000]: Train loss: 1.0542, Valid loss: 0.9467


Epoch [461/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.95it/s, loss=1.31]


Epoch [461/5000]: Train loss: 1.0623, Valid loss: 0.9565


Epoch [462/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.59it/s, loss=1.15]


Epoch [462/5000]: Train loss: 1.0563, Valid loss: 0.9472


Epoch [463/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.90it/s, loss=1.13]


Epoch [463/5000]: Train loss: 1.0496, Valid loss: 0.9400


Epoch [464/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.16it/s, loss=1.15]


Epoch [464/5000]: Train loss: 1.0484, Valid loss: 0.9567


Epoch [465/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.94it/s, loss=0.939]


Epoch [465/5000]: Train loss: 1.0411, Valid loss: 0.9429


Epoch [466/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.12it/s, loss=1.04]


Epoch [466/5000]: Train loss: 1.0537, Valid loss: 0.9451


Epoch [467/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.64it/s, loss=1.19]


Epoch [467/5000]: Train loss: 1.0459, Valid loss: 0.9549


Epoch [468/5000]: 100%|██████████| 14/14 [00:00<00:00, 163.54it/s, loss=0.914]


Epoch [468/5000]: Train loss: 1.0406, Valid loss: 0.9356


Epoch [469/5000]: 100%|██████████| 14/14 [00:00<00:00, 149.85it/s, loss=0.925]


Epoch [469/5000]: Train loss: 1.0382, Valid loss: 0.9352


Epoch [470/5000]: 100%|██████████| 14/14 [00:00<00:00, 134.44it/s, loss=1.05]


Epoch [470/5000]: Train loss: 1.0442, Valid loss: 0.9316
Saving model with loss 0.932...


Epoch [471/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.89it/s, loss=0.946]


Epoch [471/5000]: Train loss: 1.0495, Valid loss: 0.9540


Epoch [472/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.84it/s, loss=0.985]


Epoch [472/5000]: Train loss: 1.0397, Valid loss: 0.9581


Epoch [473/5000]: 100%|██████████| 14/14 [00:00<00:00, 156.25it/s, loss=0.977]


Epoch [473/5000]: Train loss: 1.0454, Valid loss: 0.9350


Epoch [474/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.01it/s, loss=1.17]


Epoch [474/5000]: Train loss: 1.0516, Valid loss: 0.9351


Epoch [475/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.31it/s, loss=1.06]


Epoch [475/5000]: Train loss: 1.0456, Valid loss: 0.9601


Epoch [476/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.90it/s, loss=1.03]


Epoch [476/5000]: Train loss: 1.0533, Valid loss: 0.9402


Epoch [477/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.29it/s, loss=1.28]


Epoch [477/5000]: Train loss: 1.0608, Valid loss: 0.9389


Epoch [478/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.38it/s, loss=0.752]


Epoch [478/5000]: Train loss: 1.0284, Valid loss: 0.9438


Epoch [479/5000]: 100%|██████████| 14/14 [00:00<00:00, 136.03it/s, loss=1.11]


Epoch [479/5000]: Train loss: 1.0440, Valid loss: 0.9409


Epoch [480/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.96it/s, loss=0.97]


Epoch [480/5000]: Train loss: 1.0428, Valid loss: 0.9398


Epoch [481/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.47it/s, loss=0.953]


Epoch [481/5000]: Train loss: 1.0420, Valid loss: 0.9644


Epoch [482/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.34it/s, loss=1.06]


Epoch [482/5000]: Train loss: 1.0420, Valid loss: 0.9371


Epoch [483/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.13it/s, loss=0.971]


Epoch [483/5000]: Train loss: 1.0380, Valid loss: 0.9480


Epoch [484/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.57it/s, loss=0.955]


Epoch [484/5000]: Train loss: 1.0360, Valid loss: 0.9359


Epoch [485/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.31it/s, loss=1.24]


Epoch [485/5000]: Train loss: 1.0554, Valid loss: 0.9379


Epoch [486/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.74it/s, loss=1.09]


Epoch [486/5000]: Train loss: 1.0451, Valid loss: 0.9369


Epoch [487/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.80it/s, loss=1.02]


Epoch [487/5000]: Train loss: 1.0478, Valid loss: 0.9530


Epoch [488/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.59it/s, loss=1.31]


Epoch [488/5000]: Train loss: 1.0567, Valid loss: 1.0143


Epoch [489/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.04it/s, loss=1.12]


Epoch [489/5000]: Train loss: 1.0506, Valid loss: 0.9405


Epoch [490/5000]: 100%|██████████| 14/14 [00:00<00:00, 168.87it/s, loss=0.882]


Epoch [490/5000]: Train loss: 1.0335, Valid loss: 0.9337


Epoch [491/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.05it/s, loss=0.95]


Epoch [491/5000]: Train loss: 1.0378, Valid loss: 0.9332


Epoch [492/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.23it/s, loss=0.9]


Epoch [492/5000]: Train loss: 1.0368, Valid loss: 0.9574


Epoch [493/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.95it/s, loss=1.17]


Epoch [493/5000]: Train loss: 1.0450, Valid loss: 0.9535


Epoch [494/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.42it/s, loss=1.12]


Epoch [494/5000]: Train loss: 1.0576, Valid loss: 0.9399


Epoch [495/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.94it/s, loss=1.01]


Epoch [495/5000]: Train loss: 1.0447, Valid loss: 0.9403


Epoch [496/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.64it/s, loss=1.06]


Epoch [496/5000]: Train loss: 1.0496, Valid loss: 0.9401


Epoch [497/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.49it/s, loss=0.802]


Epoch [497/5000]: Train loss: 1.0403, Valid loss: 0.9792


Epoch [498/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.62it/s, loss=1.06]


Epoch [498/5000]: Train loss: 1.0554, Valid loss: 0.9317


Epoch [499/5000]: 100%|██████████| 14/14 [00:00<00:00, 146.21it/s, loss=1.09]


Epoch [499/5000]: Train loss: 1.0411, Valid loss: 0.9385


Epoch [500/5000]: 100%|██████████| 14/14 [00:00<00:00, 133.34it/s, loss=1.09]


Epoch [500/5000]: Train loss: 1.0500, Valid loss: 0.9416


Epoch [501/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.04it/s, loss=1.35]


Epoch [501/5000]: Train loss: 1.0540, Valid loss: 0.9313
Saving model with loss 0.931...


Epoch [502/5000]: 100%|██████████| 14/14 [00:00<00:00, 140.23it/s, loss=0.945]


Epoch [502/5000]: Train loss: 1.0333, Valid loss: 0.9404


Epoch [503/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.76it/s, loss=1.01]


Epoch [503/5000]: Train loss: 1.0401, Valid loss: 0.9651


Epoch [504/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.57it/s, loss=1.41]


Epoch [504/5000]: Train loss: 1.0633, Valid loss: 0.9468


Epoch [505/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.70it/s, loss=0.931]


Epoch [505/5000]: Train loss: 1.0521, Valid loss: 0.9398


Epoch [506/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.75it/s, loss=0.937]


Epoch [506/5000]: Train loss: 1.0396, Valid loss: 0.9421


Epoch [507/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.70it/s, loss=0.927]


Epoch [507/5000]: Train loss: 1.0351, Valid loss: 0.9290
Saving model with loss 0.929...


Epoch [508/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.15it/s, loss=0.937]


Epoch [508/5000]: Train loss: 1.0397, Valid loss: 0.9405


Epoch [509/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.56it/s, loss=1.01]


Epoch [509/5000]: Train loss: 1.0409, Valid loss: 0.9787


Epoch [510/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.05it/s, loss=1.13]


Epoch [510/5000]: Train loss: 1.0490, Valid loss: 0.9299


Epoch [511/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.29it/s, loss=0.911]


Epoch [511/5000]: Train loss: 1.0306, Valid loss: 0.9377


Epoch [512/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.24it/s, loss=1.1]


Epoch [512/5000]: Train loss: 1.0405, Valid loss: 0.9455


Epoch [513/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.19it/s, loss=0.937]


Epoch [513/5000]: Train loss: 1.0399, Valid loss: 0.9353


Epoch [514/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.62it/s, loss=1.05]


Epoch [514/5000]: Train loss: 1.0488, Valid loss: 0.9565


Epoch [515/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.14it/s, loss=1.27]


Epoch [515/5000]: Train loss: 1.0568, Valid loss: 0.9412


Epoch [516/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.77it/s, loss=1.48]


Epoch [516/5000]: Train loss: 1.0669, Valid loss: 0.9713


Epoch [517/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.92it/s, loss=0.99]


Epoch [517/5000]: Train loss: 1.0462, Valid loss: 0.9343


Epoch [518/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.65it/s, loss=1.17]


Epoch [518/5000]: Train loss: 1.0472, Valid loss: 0.9443


Epoch [519/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.27it/s, loss=0.972]


Epoch [519/5000]: Train loss: 1.0416, Valid loss: 0.9838


Epoch [520/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.07it/s, loss=1.07]


Epoch [520/5000]: Train loss: 1.0425, Valid loss: 0.9340


Epoch [521/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.23it/s, loss=1.26]


Epoch [521/5000]: Train loss: 1.0595, Valid loss: 0.9557


Epoch [522/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.54it/s, loss=0.94]


Epoch [522/5000]: Train loss: 1.0616, Valid loss: 0.9413


Epoch [523/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.23it/s, loss=1.43]


Epoch [523/5000]: Train loss: 1.0746, Valid loss: 0.9425


Epoch [524/5000]: 100%|██████████| 14/14 [00:00<00:00, 153.76it/s, loss=0.911]


Epoch [524/5000]: Train loss: 1.0387, Valid loss: 0.9800


Epoch [525/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.85it/s, loss=1.1]


Epoch [525/5000]: Train loss: 1.0576, Valid loss: 0.9346


Epoch [526/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.09it/s, loss=1.12]


Epoch [526/5000]: Train loss: 1.0465, Valid loss: 0.9565


Epoch [527/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.83it/s, loss=0.96]


Epoch [527/5000]: Train loss: 1.0407, Valid loss: 0.9331


Epoch [528/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.48it/s, loss=1.08]


Epoch [528/5000]: Train loss: 1.0715, Valid loss: 0.9389


Epoch [529/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.66it/s, loss=0.969]


Epoch [529/5000]: Train loss: 1.0457, Valid loss: 0.9452


Epoch [530/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.87it/s, loss=0.898]


Epoch [530/5000]: Train loss: 1.0348, Valid loss: 0.9364


Epoch [531/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.62it/s, loss=1.01]


Epoch [531/5000]: Train loss: 1.0397, Valid loss: 0.9311


Epoch [532/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.06it/s, loss=1.31]


Epoch [532/5000]: Train loss: 1.0698, Valid loss: 0.9443


Epoch [533/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.17it/s, loss=1]


Epoch [533/5000]: Train loss: 1.0428, Valid loss: 1.0307


Epoch [534/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.68it/s, loss=0.936]


Epoch [534/5000]: Train loss: 1.0503, Valid loss: 0.9628


Epoch [535/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.47it/s, loss=1.31]


Epoch [535/5000]: Train loss: 1.0505, Valid loss: 0.9271
Saving model with loss 0.927...


Epoch [536/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.10it/s, loss=1.15]


Epoch [536/5000]: Train loss: 1.0469, Valid loss: 0.9715


Epoch [537/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.97it/s, loss=0.997]


Epoch [537/5000]: Train loss: 1.0391, Valid loss: 0.9297


Epoch [538/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.24it/s, loss=0.892]


Epoch [538/5000]: Train loss: 1.0350, Valid loss: 0.9311


Epoch [539/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.17it/s, loss=1.23]


Epoch [539/5000]: Train loss: 1.0492, Valid loss: 0.9330


Epoch [540/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.64it/s, loss=0.969]


Epoch [540/5000]: Train loss: 1.0378, Valid loss: 0.9516


Epoch [541/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.82it/s, loss=1.08]


Epoch [541/5000]: Train loss: 1.0462, Valid loss: 0.9250
Saving model with loss 0.925...


Epoch [542/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.41it/s, loss=1.16]


Epoch [542/5000]: Train loss: 1.0433, Valid loss: 0.9585


Epoch [543/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.99it/s, loss=1.16]


Epoch [543/5000]: Train loss: 1.0494, Valid loss: 0.9334


Epoch [544/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.09it/s, loss=0.903]


Epoch [544/5000]: Train loss: 1.0401, Valid loss: 0.9358


Epoch [545/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.44it/s, loss=0.764]


Epoch [545/5000]: Train loss: 1.0349, Valid loss: 0.9351


Epoch [546/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.39it/s, loss=0.905]


Epoch [546/5000]: Train loss: 1.0415, Valid loss: 0.9302


Epoch [547/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.99it/s, loss=1.43]


Epoch [547/5000]: Train loss: 1.0584, Valid loss: 0.9518


Epoch [548/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.73it/s, loss=1.18]


Epoch [548/5000]: Train loss: 1.0494, Valid loss: 0.9308


Epoch [549/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.49it/s, loss=1.07]


Epoch [549/5000]: Train loss: 1.0454, Valid loss: 0.9417


Epoch [550/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.19it/s, loss=1.02]


Epoch [550/5000]: Train loss: 1.0372, Valid loss: 0.9635


Epoch [551/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.71it/s, loss=0.996]


Epoch [551/5000]: Train loss: 1.0416, Valid loss: 0.9189
Saving model with loss 0.919...


Epoch [552/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.48it/s, loss=0.918]


Epoch [552/5000]: Train loss: 1.0446, Valid loss: 0.9478


Epoch [553/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.16it/s, loss=0.784]


Epoch [553/5000]: Train loss: 1.0277, Valid loss: 0.9375


Epoch [554/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.15it/s, loss=1.11]


Epoch [554/5000]: Train loss: 1.0476, Valid loss: 0.9401


Epoch [555/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.14it/s, loss=1.1]


Epoch [555/5000]: Train loss: 1.0478, Valid loss: 0.9450


Epoch [556/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.90it/s, loss=1.35]


Epoch [556/5000]: Train loss: 1.0693, Valid loss: 0.9380


Epoch [557/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.97it/s, loss=1.05]


Epoch [557/5000]: Train loss: 1.0448, Valid loss: 0.9412


Epoch [558/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.59it/s, loss=1.21]


Epoch [558/5000]: Train loss: 1.0464, Valid loss: 0.9354


Epoch [559/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.19it/s, loss=1.24]


Epoch [559/5000]: Train loss: 1.0635, Valid loss: 0.9722


Epoch [560/5000]: 100%|██████████| 14/14 [00:00<00:00, 168.25it/s, loss=0.89]


Epoch [560/5000]: Train loss: 1.0430, Valid loss: 0.9426


Epoch [561/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.26it/s, loss=1.01]


Epoch [561/5000]: Train loss: 1.0609, Valid loss: 0.9654


Epoch [562/5000]: 100%|██████████| 14/14 [00:00<00:00, 160.69it/s, loss=1.29]


Epoch [562/5000]: Train loss: 1.0697, Valid loss: 0.9361


Epoch [563/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.80it/s, loss=1.01]


Epoch [563/5000]: Train loss: 1.0495, Valid loss: 0.9697


Epoch [564/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.83it/s, loss=1.06]


Epoch [564/5000]: Train loss: 1.0648, Valid loss: 0.9910


Epoch [565/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.24it/s, loss=1.02]


Epoch [565/5000]: Train loss: 1.0465, Valid loss: 0.9307


Epoch [566/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.23it/s, loss=1.13]


Epoch [566/5000]: Train loss: 1.0449, Valid loss: 0.9646


Epoch [567/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.30it/s, loss=1]


Epoch [567/5000]: Train loss: 1.0414, Valid loss: 0.9208


Epoch [568/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.99it/s, loss=0.925]


Epoch [568/5000]: Train loss: 1.0366, Valid loss: 0.9317


Epoch [569/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.21it/s, loss=0.919]


Epoch [569/5000]: Train loss: 1.0327, Valid loss: 0.9268


Epoch [570/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.76it/s, loss=1.19]


Epoch [570/5000]: Train loss: 1.0454, Valid loss: 0.9382


Epoch [571/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.90it/s, loss=0.977]


Epoch [571/5000]: Train loss: 1.0426, Valid loss: 0.9401


Epoch [572/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.72it/s, loss=1.06]


Epoch [572/5000]: Train loss: 1.0486, Valid loss: 0.9417


Epoch [573/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.32it/s, loss=1.04]


Epoch [573/5000]: Train loss: 1.0512, Valid loss: 0.9467


Epoch [574/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.27it/s, loss=0.796]


Epoch [574/5000]: Train loss: 1.0326, Valid loss: 0.9297


Epoch [575/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.15it/s, loss=1.08]


Epoch [575/5000]: Train loss: 1.0464, Valid loss: 0.9260


Epoch [576/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.20it/s, loss=1.03]


Epoch [576/5000]: Train loss: 1.0536, Valid loss: 1.0428


Epoch [577/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.33it/s, loss=0.967]


Epoch [577/5000]: Train loss: 1.0462, Valid loss: 0.9256


Epoch [578/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.59it/s, loss=0.871]


Epoch [578/5000]: Train loss: 1.0376, Valid loss: 0.9366


Epoch [579/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.95it/s, loss=1.08]


Epoch [579/5000]: Train loss: 1.0472, Valid loss: 0.9356


Epoch [580/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.65it/s, loss=1.16]


Epoch [580/5000]: Train loss: 1.0455, Valid loss: 0.9343


Epoch [581/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.98it/s, loss=0.883]


Epoch [581/5000]: Train loss: 1.0351, Valid loss: 0.9277


Epoch [582/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.87it/s, loss=1.16]


Epoch [582/5000]: Train loss: 1.0467, Valid loss: 0.9264


Epoch [583/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.87it/s, loss=1.17]


Epoch [583/5000]: Train loss: 1.0470, Valid loss: 0.9569


Epoch [584/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.79it/s, loss=0.815]


Epoch [584/5000]: Train loss: 1.0274, Valid loss: 0.9241


Epoch [585/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.13it/s, loss=1.2]


Epoch [585/5000]: Train loss: 1.0453, Valid loss: 0.9522


Epoch [586/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.13it/s, loss=0.939]


Epoch [586/5000]: Train loss: 1.0368, Valid loss: 0.9218


Epoch [587/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.59it/s, loss=0.983]


Epoch [587/5000]: Train loss: 1.0376, Valid loss: 0.9304


Epoch [588/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.82it/s, loss=1]


Epoch [588/5000]: Train loss: 1.0425, Valid loss: 0.9469


Epoch [589/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.03it/s, loss=0.949]


Epoch [589/5000]: Train loss: 1.0339, Valid loss: 0.9243


Epoch [590/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.04it/s, loss=0.928]


Epoch [590/5000]: Train loss: 1.0368, Valid loss: 0.9315


Epoch [591/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.29it/s, loss=1.21]


Epoch [591/5000]: Train loss: 1.0453, Valid loss: 0.9557


Epoch [592/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.74it/s, loss=1.19]


Epoch [592/5000]: Train loss: 1.0485, Valid loss: 0.9242


Epoch [593/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.41it/s, loss=1.04]


Epoch [593/5000]: Train loss: 1.0437, Valid loss: 0.9236


Epoch [594/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.78it/s, loss=1.18]


Epoch [594/5000]: Train loss: 1.0463, Valid loss: 0.9294


Epoch [595/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.40it/s, loss=1.01]


Epoch [595/5000]: Train loss: 1.0390, Valid loss: 0.9375


Epoch [596/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.63it/s, loss=0.95]


Epoch [596/5000]: Train loss: 1.0362, Valid loss: 0.9271


Epoch [597/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.01it/s, loss=1.15]


Epoch [597/5000]: Train loss: 1.0498, Valid loss: 0.9419


Epoch [598/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.75it/s, loss=1.06]


Epoch [598/5000]: Train loss: 1.0508, Valid loss: 1.0034


Epoch [599/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.08it/s, loss=0.797]


Epoch [599/5000]: Train loss: 1.0316, Valid loss: 0.9311


Epoch [600/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.94it/s, loss=1.05]


Epoch [600/5000]: Train loss: 1.0399, Valid loss: 0.9329


Epoch [601/5000]: 100%|██████████| 14/14 [00:00<00:00, 146.49it/s, loss=1.11]


Epoch [601/5000]: Train loss: 1.0427, Valid loss: 0.9597


Epoch [602/5000]: 100%|██████████| 14/14 [00:00<00:00, 135.46it/s, loss=0.879]


Epoch [602/5000]: Train loss: 1.0310, Valid loss: 0.9347


Epoch [603/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.46it/s, loss=1.16]


Epoch [603/5000]: Train loss: 1.0406, Valid loss: 0.9592


Epoch [604/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.06it/s, loss=1.07]


Epoch [604/5000]: Train loss: 1.0518, Valid loss: 0.9380


Epoch [605/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.09it/s, loss=1.09]


Epoch [605/5000]: Train loss: 1.0418, Valid loss: 0.9393


Epoch [606/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.39it/s, loss=1.03]


Epoch [606/5000]: Train loss: 1.0433, Valid loss: 0.9184
Saving model with loss 0.918...


Epoch [607/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.74it/s, loss=1.2]


Epoch [607/5000]: Train loss: 1.0531, Valid loss: 0.9632


Epoch [608/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.30it/s, loss=0.839]


Epoch [608/5000]: Train loss: 1.0323, Valid loss: 0.9358


Epoch [609/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.46it/s, loss=0.957]


Epoch [609/5000]: Train loss: 1.0351, Valid loss: 0.9325


Epoch [610/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.50it/s, loss=0.957]


Epoch [610/5000]: Train loss: 1.0352, Valid loss: 0.9252


Epoch [611/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.64it/s, loss=0.9]


Epoch [611/5000]: Train loss: 1.0366, Valid loss: 0.9694


Epoch [612/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.58it/s, loss=0.903]


Epoch [612/5000]: Train loss: 1.0346, Valid loss: 0.9286


Epoch [613/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.15it/s, loss=0.963]


Epoch [613/5000]: Train loss: 1.0352, Valid loss: 0.9242


Epoch [614/5000]: 100%|██████████| 14/14 [00:00<00:00, 169.01it/s, loss=1.39]


Epoch [614/5000]: Train loss: 1.0597, Valid loss: 0.9737


Epoch [615/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.32it/s, loss=0.922]


Epoch [615/5000]: Train loss: 1.0362, Valid loss: 0.9277


Epoch [616/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.44it/s, loss=1.1]


Epoch [616/5000]: Train loss: 1.0503, Valid loss: 0.9389


Epoch [617/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.19it/s, loss=0.988]


Epoch [617/5000]: Train loss: 1.0360, Valid loss: 0.9362


Epoch [618/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.82it/s, loss=0.979]


Epoch [618/5000]: Train loss: 1.0353, Valid loss: 0.9930


Epoch [619/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.78it/s, loss=0.972]


Epoch [619/5000]: Train loss: 1.0492, Valid loss: 0.9234


Epoch [620/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.86it/s, loss=1.04]


Epoch [620/5000]: Train loss: 1.0540, Valid loss: 0.9367


Epoch [621/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.55it/s, loss=1.01]


Epoch [621/5000]: Train loss: 1.0533, Valid loss: 0.9803


Epoch [622/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.09it/s, loss=1.07]


Epoch [622/5000]: Train loss: 1.0655, Valid loss: 0.9454


Epoch [623/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.61it/s, loss=0.985]


Epoch [623/5000]: Train loss: 1.0488, Valid loss: 0.9293


Epoch [624/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.89it/s, loss=0.969]


Epoch [624/5000]: Train loss: 1.0369, Valid loss: 0.9398


Epoch [625/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.49it/s, loss=1.33]


Epoch [625/5000]: Train loss: 1.0726, Valid loss: 0.9696


Epoch [626/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.25it/s, loss=1.05]


Epoch [626/5000]: Train loss: 1.0393, Valid loss: 0.9154
Saving model with loss 0.915...


Epoch [627/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.63it/s, loss=1.19]


Epoch [627/5000]: Train loss: 1.0470, Valid loss: 0.9513


Epoch [628/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.77it/s, loss=0.889]


Epoch [628/5000]: Train loss: 1.0259, Valid loss: 0.9325


Epoch [629/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.31it/s, loss=1.05]


Epoch [629/5000]: Train loss: 1.0416, Valid loss: 0.9361


Epoch [630/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.67it/s, loss=1.01]


Epoch [630/5000]: Train loss: 1.0427, Valid loss: 0.9287


Epoch [631/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.39it/s, loss=0.892]


Epoch [631/5000]: Train loss: 1.0345, Valid loss: 0.9624


Epoch [632/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.67it/s, loss=0.986]


Epoch [632/5000]: Train loss: 1.0386, Valid loss: 0.9378


Epoch [633/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.17it/s, loss=1.09]


Epoch [633/5000]: Train loss: 1.0364, Valid loss: 0.9560


Epoch [634/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.59it/s, loss=1.03]


Epoch [634/5000]: Train loss: 1.0385, Valid loss: 0.9303


Epoch [635/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.22it/s, loss=0.882]


Epoch [635/5000]: Train loss: 1.0311, Valid loss: 0.9298


Epoch [636/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.94it/s, loss=0.98]


Epoch [636/5000]: Train loss: 1.0348, Valid loss: 0.9273


Epoch [637/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.43it/s, loss=0.855]


Epoch [637/5000]: Train loss: 1.0321, Valid loss: 0.9462


Epoch [638/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.15it/s, loss=0.904]


Epoch [638/5000]: Train loss: 1.0406, Valid loss: 0.9284


Epoch [639/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.88it/s, loss=1.04]


Epoch [639/5000]: Train loss: 1.0389, Valid loss: 0.9320


Epoch [640/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.82it/s, loss=0.835]


Epoch [640/5000]: Train loss: 1.0294, Valid loss: 0.9115
Saving model with loss 0.911...


Epoch [641/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.72it/s, loss=0.906]


Epoch [641/5000]: Train loss: 1.0319, Valid loss: 0.9270


Epoch [642/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.27it/s, loss=1.15]


Epoch [642/5000]: Train loss: 1.0526, Valid loss: 0.9403


Epoch [643/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.28it/s, loss=1.14]


Epoch [643/5000]: Train loss: 1.0401, Valid loss: 0.9275


Epoch [644/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.77it/s, loss=0.964]


Epoch [644/5000]: Train loss: 1.0397, Valid loss: 0.9283


Epoch [645/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.01it/s, loss=1.18]


Epoch [645/5000]: Train loss: 1.0424, Valid loss: 0.9369


Epoch [646/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.09it/s, loss=1.11]


Epoch [646/5000]: Train loss: 1.0473, Valid loss: 0.9195


Epoch [647/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.71it/s, loss=1.24]


Epoch [647/5000]: Train loss: 1.0553, Valid loss: 0.9354


Epoch [648/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.23it/s, loss=1.27]


Epoch [648/5000]: Train loss: 1.0556, Valid loss: 0.9288


Epoch [649/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.81it/s, loss=0.984]


Epoch [649/5000]: Train loss: 1.0398, Valid loss: 0.9256


Epoch [650/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.91it/s, loss=1.23]


Epoch [650/5000]: Train loss: 1.0460, Valid loss: 0.9666


Epoch [651/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.71it/s, loss=0.903]


Epoch [651/5000]: Train loss: 1.0315, Valid loss: 0.9219


Epoch [652/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.88it/s, loss=0.949]


Epoch [652/5000]: Train loss: 1.0367, Valid loss: 0.9197


Epoch [653/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.03it/s, loss=0.874]


Epoch [653/5000]: Train loss: 1.0313, Valid loss: 0.9240


Epoch [654/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.67it/s, loss=0.967]


Epoch [654/5000]: Train loss: 1.0455, Valid loss: 0.9351


Epoch [655/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.08it/s, loss=1.18]


Epoch [655/5000]: Train loss: 1.0443, Valid loss: 0.9248


Epoch [656/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.78it/s, loss=1.18]


Epoch [656/5000]: Train loss: 1.0426, Valid loss: 0.9199


Epoch [657/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.34it/s, loss=0.908]


Epoch [657/5000]: Train loss: 1.0370, Valid loss: 0.9607


Epoch [658/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.82it/s, loss=1.04]


Epoch [658/5000]: Train loss: 1.0449, Valid loss: 0.9297


Epoch [659/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.88it/s, loss=1.12]


Epoch [659/5000]: Train loss: 1.0603, Valid loss: 0.9403


Epoch [660/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.09it/s, loss=0.907]


Epoch [660/5000]: Train loss: 1.0309, Valid loss: 0.9329


Epoch [661/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.97it/s, loss=0.969]


Epoch [661/5000]: Train loss: 1.0527, Valid loss: 0.9272


Epoch [662/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.65it/s, loss=0.929]


Epoch [662/5000]: Train loss: 1.0365, Valid loss: 0.9309


Epoch [663/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.33it/s, loss=1.07]


Epoch [663/5000]: Train loss: 1.0401, Valid loss: 0.9235


Epoch [664/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.75it/s, loss=1]


Epoch [664/5000]: Train loss: 1.0402, Valid loss: 0.9512


Epoch [665/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.08it/s, loss=0.949]


Epoch [665/5000]: Train loss: 1.0639, Valid loss: 0.9620


Epoch [666/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.01it/s, loss=0.97]


Epoch [666/5000]: Train loss: 1.0436, Valid loss: 0.9264


Epoch [667/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.14it/s, loss=0.961]


Epoch [667/5000]: Train loss: 1.0444, Valid loss: 0.9191


Epoch [668/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.41it/s, loss=1.07]


Epoch [668/5000]: Train loss: 1.0410, Valid loss: 0.9425


Epoch [669/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.24it/s, loss=1.1]


Epoch [669/5000]: Train loss: 1.0614, Valid loss: 0.9243


Epoch [670/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.15it/s, loss=1.29]


Epoch [670/5000]: Train loss: 1.0500, Valid loss: 0.9326


Epoch [671/5000]: 100%|██████████| 14/14 [00:00<00:00, 145.17it/s, loss=1.33]


Epoch [671/5000]: Train loss: 1.0503, Valid loss: 0.9247


Epoch [672/5000]: 100%|██████████| 14/14 [00:00<00:00, 163.75it/s, loss=1.36]


Epoch [672/5000]: Train loss: 1.0595, Valid loss: 0.9333


Epoch [673/5000]: 100%|██████████| 14/14 [00:00<00:00, 117.35it/s, loss=0.837]


Epoch [673/5000]: Train loss: 1.0267, Valid loss: 0.9596


Epoch [674/5000]: 100%|██████████| 14/14 [00:00<00:00, 146.54it/s, loss=1.1]


Epoch [674/5000]: Train loss: 1.0562, Valid loss: 0.9371


Epoch [675/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.51it/s, loss=1.15]


Epoch [675/5000]: Train loss: 1.0639, Valid loss: 0.9259


Epoch [676/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.43it/s, loss=0.836]


Epoch [676/5000]: Train loss: 1.0275, Valid loss: 0.9276


Epoch [677/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.68it/s, loss=1.05]


Epoch [677/5000]: Train loss: 1.0393, Valid loss: 0.9275


Epoch [678/5000]: 100%|██████████| 14/14 [00:00<00:00, 162.62it/s, loss=0.989]


Epoch [678/5000]: Train loss: 1.0393, Valid loss: 0.9225


Epoch [679/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.66it/s, loss=1.28]


Epoch [679/5000]: Train loss: 1.0482, Valid loss: 0.9487


Epoch [680/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.92it/s, loss=0.808]


Epoch [680/5000]: Train loss: 1.0347, Valid loss: 0.9177


Epoch [681/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.69it/s, loss=1.06]


Epoch [681/5000]: Train loss: 1.0379, Valid loss: 0.9165


Epoch [682/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.94it/s, loss=0.991]


Epoch [682/5000]: Train loss: 1.0333, Valid loss: 0.9302


Epoch [683/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.03it/s, loss=1.05]


Epoch [683/5000]: Train loss: 1.0410, Valid loss: 0.9186


Epoch [684/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.55it/s, loss=0.998]


Epoch [684/5000]: Train loss: 1.0346, Valid loss: 0.9391


Epoch [685/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.40it/s, loss=0.975]


Epoch [685/5000]: Train loss: 1.0380, Valid loss: 0.9235


Epoch [686/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.25it/s, loss=1.24]


Epoch [686/5000]: Train loss: 1.0475, Valid loss: 0.9300


Epoch [687/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.66it/s, loss=0.908]


Epoch [687/5000]: Train loss: 1.0378, Valid loss: 0.9204


Epoch [688/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.66it/s, loss=1.15]


Epoch [688/5000]: Train loss: 1.0469, Valid loss: 0.9238


Epoch [689/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.21it/s, loss=1.08]


Epoch [689/5000]: Train loss: 1.0382, Valid loss: 0.9443


Epoch [690/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.22it/s, loss=1.01]


Epoch [690/5000]: Train loss: 1.0412, Valid loss: 0.9230


Epoch [691/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.99it/s, loss=0.999]


Epoch [691/5000]: Train loss: 1.0373, Valid loss: 0.9268


Epoch [692/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.86it/s, loss=1.14]


Epoch [692/5000]: Train loss: 1.0425, Valid loss: 0.9515


Epoch [693/5000]: 100%|██████████| 14/14 [00:00<00:00, 152.94it/s, loss=0.912]


Epoch [693/5000]: Train loss: 1.0299, Valid loss: 0.9215


Epoch [694/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.37it/s, loss=1.09]


Epoch [694/5000]: Train loss: 1.0404, Valid loss: 0.9436


Epoch [695/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.14it/s, loss=0.854]


Epoch [695/5000]: Train loss: 1.0303, Valid loss: 0.9803


Epoch [696/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.99it/s, loss=0.941]


Epoch [696/5000]: Train loss: 1.0410, Valid loss: 0.9629


Epoch [697/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.44it/s, loss=1.13]


Epoch [697/5000]: Train loss: 1.0482, Valid loss: 0.9288


Epoch [698/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.86it/s, loss=1.11]


Epoch [698/5000]: Train loss: 1.0517, Valid loss: 0.9748


Epoch [699/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.67it/s, loss=0.914]


Epoch [699/5000]: Train loss: 1.0414, Valid loss: 0.9267


Epoch [700/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.02it/s, loss=0.881]


Epoch [700/5000]: Train loss: 1.0305, Valid loss: 0.9219


Epoch [701/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.12it/s, loss=0.912]


Epoch [701/5000]: Train loss: 1.0301, Valid loss: 0.9332


Epoch [702/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.65it/s, loss=0.933]


Epoch [702/5000]: Train loss: 1.0321, Valid loss: 0.9164


Epoch [703/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.69it/s, loss=0.802]


Epoch [703/5000]: Train loss: 1.0263, Valid loss: 0.9287


Epoch [704/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.85it/s, loss=0.874]


Epoch [704/5000]: Train loss: 1.0272, Valid loss: 0.9263


Epoch [705/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.85it/s, loss=0.97]


Epoch [705/5000]: Train loss: 1.0342, Valid loss: 0.9499


Epoch [706/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.98it/s, loss=1.33]


Epoch [706/5000]: Train loss: 1.0584, Valid loss: 0.9217


Epoch [707/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.40it/s, loss=0.896]


Epoch [707/5000]: Train loss: 1.0413, Valid loss: 0.9860


Epoch [708/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.99it/s, loss=0.887]


Epoch [708/5000]: Train loss: 1.0403, Valid loss: 0.9225


Epoch [709/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.83it/s, loss=1.07]


Epoch [709/5000]: Train loss: 1.0394, Valid loss: 0.9155


Epoch [710/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.48it/s, loss=1.55]


Epoch [710/5000]: Train loss: 1.0547, Valid loss: 0.9427


Epoch [711/5000]: 100%|██████████| 14/14 [00:00<00:00, 140.48it/s, loss=0.996]


Epoch [711/5000]: Train loss: 1.0361, Valid loss: 0.9220


Epoch [712/5000]: 100%|██████████| 14/14 [00:00<00:00, 140.02it/s, loss=1.07]


Epoch [712/5000]: Train loss: 1.0387, Valid loss: 0.9281


Epoch [713/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.20it/s, loss=0.879]


Epoch [713/5000]: Train loss: 1.0321, Valid loss: 0.9295


Epoch [714/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.78it/s, loss=1.12]


Epoch [714/5000]: Train loss: 1.0419, Valid loss: 0.9242


Epoch [715/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.62it/s, loss=1.16]


Epoch [715/5000]: Train loss: 1.0440, Valid loss: 0.9541


Epoch [716/5000]: 100%|██████████| 14/14 [00:00<00:00, 149.82it/s, loss=0.957]


Epoch [716/5000]: Train loss: 1.0398, Valid loss: 0.9262


Epoch [717/5000]: 100%|██████████| 14/14 [00:00<00:00, 137.14it/s, loss=0.947]


Epoch [717/5000]: Train loss: 1.0326, Valid loss: 0.9223


Epoch [718/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.32it/s, loss=1.06]


Epoch [718/5000]: Train loss: 1.0397, Valid loss: 0.9310


Epoch [719/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.94it/s, loss=0.981]


Epoch [719/5000]: Train loss: 1.0335, Valid loss: 0.9250


Epoch [720/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.63it/s, loss=0.856]


Epoch [720/5000]: Train loss: 1.0233, Valid loss: 0.9292


Epoch [721/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.31it/s, loss=1.26]


Epoch [721/5000]: Train loss: 1.0513, Valid loss: 0.9250


Epoch [722/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.49it/s, loss=1.01]


Epoch [722/5000]: Train loss: 1.0347, Valid loss: 0.9293


Epoch [723/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.48it/s, loss=1.18]


Epoch [723/5000]: Train loss: 1.0421, Valid loss: 0.9292


Epoch [724/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.52it/s, loss=0.749]


Epoch [724/5000]: Train loss: 1.0269, Valid loss: 0.9260


Epoch [725/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.25it/s, loss=0.837]


Epoch [725/5000]: Train loss: 1.0276, Valid loss: 0.9222


Epoch [726/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.20it/s, loss=1.16]


Epoch [726/5000]: Train loss: 1.0513, Valid loss: 0.9237


Epoch [727/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.31it/s, loss=1.12]


Epoch [727/5000]: Train loss: 1.0391, Valid loss: 0.9272


Epoch [728/5000]: 100%|██████████| 14/14 [00:00<00:00, 143.80it/s, loss=1.04]


Epoch [728/5000]: Train loss: 1.0359, Valid loss: 0.9344


Epoch [729/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.79it/s, loss=0.962]


Epoch [729/5000]: Train loss: 1.0385, Valid loss: 0.9209


Epoch [730/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.90it/s, loss=1.51]


Epoch [730/5000]: Train loss: 1.0568, Valid loss: 0.9289


Epoch [731/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.91it/s, loss=0.921]


Epoch [731/5000]: Train loss: 1.0592, Valid loss: 0.9293


Epoch [732/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.36it/s, loss=0.979]


Epoch [732/5000]: Train loss: 1.0406, Valid loss: 0.9572


Epoch [733/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.92it/s, loss=1.2]


Epoch [733/5000]: Train loss: 1.0408, Valid loss: 0.9241


Epoch [734/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.92it/s, loss=1.11]


Epoch [734/5000]: Train loss: 1.0510, Valid loss: 0.9254


Epoch [735/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.22it/s, loss=1.13]


Epoch [735/5000]: Train loss: 1.0412, Valid loss: 0.9716


Epoch [736/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.23it/s, loss=1.15]


Epoch [736/5000]: Train loss: 1.0416, Valid loss: 0.9187


Epoch [737/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.03it/s, loss=0.884]


Epoch [737/5000]: Train loss: 1.0313, Valid loss: 0.9231


Epoch [738/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.48it/s, loss=1.18]


Epoch [738/5000]: Train loss: 1.0546, Valid loss: 0.9229


Epoch [739/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.38it/s, loss=0.926]


Epoch [739/5000]: Train loss: 1.0377, Valid loss: 0.9641


Epoch [740/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.33it/s, loss=0.929]


Epoch [740/5000]: Train loss: 1.0439, Valid loss: 0.9258


Epoch [741/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.27it/s, loss=0.951]


Epoch [741/5000]: Train loss: 1.0429, Valid loss: 0.9280


Epoch [742/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.75it/s, loss=0.977]


Epoch [742/5000]: Train loss: 1.0426, Valid loss: 0.9592


Epoch [743/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.10it/s, loss=1.2]


Epoch [743/5000]: Train loss: 1.0399, Valid loss: 0.9196


Epoch [744/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.01it/s, loss=1.04]


Epoch [744/5000]: Train loss: 1.0358, Valid loss: 0.9378


Epoch [745/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.22it/s, loss=1.13]


Epoch [745/5000]: Train loss: 1.0408, Valid loss: 0.9180


Epoch [746/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.79it/s, loss=0.817]


Epoch [746/5000]: Train loss: 1.0269, Valid loss: 0.9346


Epoch [747/5000]: 100%|██████████| 14/14 [00:00<00:00, 154.46it/s, loss=0.844]


Epoch [747/5000]: Train loss: 1.0273, Valid loss: 0.9462


Epoch [748/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.32it/s, loss=1.15]


Epoch [748/5000]: Train loss: 1.0397, Valid loss: 0.9219


Epoch [749/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.88it/s, loss=1.16]


Epoch [749/5000]: Train loss: 1.0534, Valid loss: 0.9401


Epoch [750/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.11it/s, loss=0.93]


Epoch [750/5000]: Train loss: 1.0469, Valid loss: 0.9275


Epoch [751/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.23it/s, loss=1.28]


Epoch [751/5000]: Train loss: 1.0545, Valid loss: 0.9250


Epoch [752/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.53it/s, loss=0.917]


Epoch [752/5000]: Train loss: 1.0253, Valid loss: 0.9216


Epoch [753/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.63it/s, loss=0.791]


Epoch [753/5000]: Train loss: 1.0288, Valid loss: 0.9339


Epoch [754/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.11it/s, loss=0.982]


Epoch [754/5000]: Train loss: 1.0427, Valid loss: 0.9350


Epoch [755/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.55it/s, loss=1.05]


Epoch [755/5000]: Train loss: 1.0550, Valid loss: 0.9199


Epoch [756/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.51it/s, loss=0.795]


Epoch [756/5000]: Train loss: 1.0292, Valid loss: 0.9426


Epoch [757/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.15it/s, loss=1.13]


Epoch [757/5000]: Train loss: 1.0450, Valid loss: 0.9321


Epoch [758/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.79it/s, loss=1.1]


Epoch [758/5000]: Train loss: 1.0462, Valid loss: 0.9173


Epoch [759/5000]: 100%|██████████| 14/14 [00:00<00:00, 156.68it/s, loss=0.971]


Epoch [759/5000]: Train loss: 1.0396, Valid loss: 0.9559


Epoch [760/5000]: 100%|██████████| 14/14 [00:00<00:00, 145.25it/s, loss=1.09]


Epoch [760/5000]: Train loss: 1.0494, Valid loss: 0.9168


Epoch [761/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.23it/s, loss=1.13]


Epoch [761/5000]: Train loss: 1.0438, Valid loss: 0.9334


Epoch [762/5000]: 100%|██████████| 14/14 [00:00<00:00, 163.30it/s, loss=0.884]


Epoch [762/5000]: Train loss: 1.0387, Valid loss: 0.9364


Epoch [763/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.91it/s, loss=1.23]


Epoch [763/5000]: Train loss: 1.0429, Valid loss: 0.9318


Epoch [764/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.28it/s, loss=1.11]


Epoch [764/5000]: Train loss: 1.0360, Valid loss: 0.9185


Epoch [765/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.45it/s, loss=1.05]


Epoch [765/5000]: Train loss: 1.0420, Valid loss: 0.9326


Epoch [766/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.38it/s, loss=0.947]


Epoch [766/5000]: Train loss: 1.0317, Valid loss: 0.9319


Epoch [767/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.10it/s, loss=0.972]


Epoch [767/5000]: Train loss: 1.0292, Valid loss: 0.9255


Epoch [768/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.60it/s, loss=1.13]


Epoch [768/5000]: Train loss: 1.0426, Valid loss: 0.9289


Epoch [769/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.42it/s, loss=0.869]


Epoch [769/5000]: Train loss: 1.0307, Valid loss: 0.9508


Epoch [770/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.90it/s, loss=0.959]


Epoch [770/5000]: Train loss: 1.0306, Valid loss: 0.9383


Epoch [771/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.12it/s, loss=1.11]


Epoch [771/5000]: Train loss: 1.0591, Valid loss: 0.9535


Epoch [772/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.44it/s, loss=1.03]


Epoch [772/5000]: Train loss: 1.0371, Valid loss: 0.9316


Epoch [773/5000]: 100%|██████████| 14/14 [00:00<00:00, 166.75it/s, loss=1.1]


Epoch [773/5000]: Train loss: 1.0442, Valid loss: 0.9509


Epoch [774/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.59it/s, loss=1.26]


Epoch [774/5000]: Train loss: 1.0607, Valid loss: 0.9281


Epoch [775/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.75it/s, loss=1.03]


Epoch [775/5000]: Train loss: 1.0474, Valid loss: 0.9411


Epoch [776/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.47it/s, loss=0.932]


Epoch [776/5000]: Train loss: 1.0309, Valid loss: 0.9174


Epoch [777/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.53it/s, loss=0.857]


Epoch [777/5000]: Train loss: 1.0283, Valid loss: 0.9567


Epoch [778/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.08it/s, loss=1.25]


Epoch [778/5000]: Train loss: 1.0476, Valid loss: 0.9192


Epoch [779/5000]: 100%|██████████| 14/14 [00:00<00:00, 158.74it/s, loss=1.15]


Epoch [779/5000]: Train loss: 1.0542, Valid loss: 0.9215


Epoch [780/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.50it/s, loss=1.15]


Epoch [780/5000]: Train loss: 1.0421, Valid loss: 0.9434


Epoch [781/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.71it/s, loss=0.944]


Epoch [781/5000]: Train loss: 1.0312, Valid loss: 0.9544


Epoch [782/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.83it/s, loss=0.955]


Epoch [782/5000]: Train loss: 1.0370, Valid loss: 0.9349


Epoch [783/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.69it/s, loss=1.16]


Epoch [783/5000]: Train loss: 1.0574, Valid loss: 0.9473


Epoch [784/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.06it/s, loss=1.17]


Epoch [784/5000]: Train loss: 1.0414, Valid loss: 0.9279


Epoch [785/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.93it/s, loss=0.875]


Epoch [785/5000]: Train loss: 1.0373, Valid loss: 0.9350


Epoch [786/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.21it/s, loss=1.05]


Epoch [786/5000]: Train loss: 1.0364, Valid loss: 0.9219


Epoch [787/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.82it/s, loss=0.893]


Epoch [787/5000]: Train loss: 1.0364, Valid loss: 0.9302


Epoch [788/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.89it/s, loss=1.01]


Epoch [788/5000]: Train loss: 1.0394, Valid loss: 0.9392


Epoch [789/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.67it/s, loss=0.884]


Epoch [789/5000]: Train loss: 1.0263, Valid loss: 0.9149


Epoch [790/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.63it/s, loss=1.37]


Epoch [790/5000]: Train loss: 1.0580, Valid loss: 0.9256


Epoch [791/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.62it/s, loss=1.09]


Epoch [791/5000]: Train loss: 1.0378, Valid loss: 0.9188


Epoch [792/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.06it/s, loss=1.04]


Epoch [792/5000]: Train loss: 1.0480, Valid loss: 0.9697


Epoch [793/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.95it/s, loss=0.929]


Epoch [793/5000]: Train loss: 1.0337, Valid loss: 0.9215


Epoch [794/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.07it/s, loss=0.959]


Epoch [794/5000]: Train loss: 1.0406, Valid loss: 0.9301


Epoch [795/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.15it/s, loss=1.02]


Epoch [795/5000]: Train loss: 1.0394, Valid loss: 0.9418


Epoch [796/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.07it/s, loss=1.08]


Epoch [796/5000]: Train loss: 1.0428, Valid loss: 0.9320


Epoch [797/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.40it/s, loss=1.02]


Epoch [797/5000]: Train loss: 1.0442, Valid loss: 0.9295


Epoch [798/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.39it/s, loss=1.14]


Epoch [798/5000]: Train loss: 1.0494, Valid loss: 0.9855


Epoch [799/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.19it/s, loss=0.776]


Epoch [799/5000]: Train loss: 1.0334, Valid loss: 0.9239


Epoch [800/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.86it/s, loss=0.896]


Epoch [800/5000]: Train loss: 1.0458, Valid loss: 0.9228


Epoch [801/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.87it/s, loss=0.866]


Epoch [801/5000]: Train loss: 1.0654, Valid loss: 0.9992


Epoch [802/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.09it/s, loss=1.19]


Epoch [802/5000]: Train loss: 1.0521, Valid loss: 0.9195


Epoch [803/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.95it/s, loss=1.04]


Epoch [803/5000]: Train loss: 1.0361, Valid loss: 0.9311


Epoch [804/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.88it/s, loss=1.3]


Epoch [804/5000]: Train loss: 1.0554, Valid loss: 0.9730


Epoch [805/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.60it/s, loss=0.938]


Epoch [805/5000]: Train loss: 1.0326, Valid loss: 0.9121


Epoch [806/5000]: 100%|██████████| 14/14 [00:00<00:00, 150.50it/s, loss=1.11]


Epoch [806/5000]: Train loss: 1.0376, Valid loss: 0.9517


Epoch [807/5000]: 100%|██████████| 14/14 [00:00<00:00, 128.28it/s, loss=1.28]


Epoch [807/5000]: Train loss: 1.0544, Valid loss: 0.9165


Epoch [808/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.51it/s, loss=1.06]


Epoch [808/5000]: Train loss: 1.0401, Valid loss: 0.9258


Epoch [809/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.12it/s, loss=1.41]


Epoch [809/5000]: Train loss: 1.0548, Valid loss: 0.9483


Epoch [810/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.99it/s, loss=1.04]


Epoch [810/5000]: Train loss: 1.0466, Valid loss: 0.9223


Epoch [811/5000]: 100%|██████████| 14/14 [00:00<00:00, 149.76it/s, loss=1.11]


Epoch [811/5000]: Train loss: 1.0505, Valid loss: 0.9341


Epoch [812/5000]: 100%|██████████| 14/14 [00:00<00:00, 136.50it/s, loss=1.04]


Epoch [812/5000]: Train loss: 1.0349, Valid loss: 0.9524


Epoch [813/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.60it/s, loss=0.997]


Epoch [813/5000]: Train loss: 1.0437, Valid loss: 0.9192


Epoch [814/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.72it/s, loss=1.08]


Epoch [814/5000]: Train loss: 1.0445, Valid loss: 0.9474


Epoch [815/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.79it/s, loss=0.926]


Epoch [815/5000]: Train loss: 1.0535, Valid loss: 0.9207


Epoch [816/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.03it/s, loss=0.781]


Epoch [816/5000]: Train loss: 1.0279, Valid loss: 0.9339


Epoch [817/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.44it/s, loss=1.09]


Epoch [817/5000]: Train loss: 1.0412, Valid loss: 0.9350


Epoch [818/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.78it/s, loss=1.01]


Epoch [818/5000]: Train loss: 1.0380, Valid loss: 0.9194


Epoch [819/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.42it/s, loss=1.05]


Epoch [819/5000]: Train loss: 1.0401, Valid loss: 0.9419


Epoch [820/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.16it/s, loss=1.01]


Epoch [820/5000]: Train loss: 1.0310, Valid loss: 0.9444


Epoch [821/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.51it/s, loss=0.952]


Epoch [821/5000]: Train loss: 1.0308, Valid loss: 0.9167


Epoch [822/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.49it/s, loss=0.976]


Epoch [822/5000]: Train loss: 1.0304, Valid loss: 0.9198


Epoch [823/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.90it/s, loss=0.885]


Epoch [823/5000]: Train loss: 1.0375, Valid loss: 0.9270


Epoch [824/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.79it/s, loss=1.13]


Epoch [824/5000]: Train loss: 1.0450, Valid loss: 0.9277


Epoch [825/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.27it/s, loss=1.21]


Epoch [825/5000]: Train loss: 1.0418, Valid loss: 0.9235


Epoch [826/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.38it/s, loss=1.09]


Epoch [826/5000]: Train loss: 1.0394, Valid loss: 0.9576


Epoch [827/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.76it/s, loss=1.1]


Epoch [827/5000]: Train loss: 1.0485, Valid loss: 0.9201


Epoch [828/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.76it/s, loss=1.05]


Epoch [828/5000]: Train loss: 1.0356, Valid loss: 0.9290


Epoch [829/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.42it/s, loss=0.98]


Epoch [829/5000]: Train loss: 1.0303, Valid loss: 0.9477


Epoch [830/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.04it/s, loss=1]


Epoch [830/5000]: Train loss: 1.0333, Valid loss: 0.9153


Epoch [831/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.70it/s, loss=1.07]


Epoch [831/5000]: Train loss: 1.0451, Valid loss: 0.9164


Epoch [832/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.79it/s, loss=0.909]


Epoch [832/5000]: Train loss: 1.0321, Valid loss: 0.9339


Epoch [833/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.41it/s, loss=0.861]


Epoch [833/5000]: Train loss: 1.0251, Valid loss: 0.9210


Epoch [834/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.09it/s, loss=1.05]


Epoch [834/5000]: Train loss: 1.0377, Valid loss: 0.9183


Epoch [835/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.24it/s, loss=1.08]


Epoch [835/5000]: Train loss: 1.0357, Valid loss: 0.9377


Epoch [836/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.28it/s, loss=1.12]


Epoch [836/5000]: Train loss: 1.0393, Valid loss: 0.9191


Epoch [837/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.80it/s, loss=0.991]


Epoch [837/5000]: Train loss: 1.0462, Valid loss: 0.9186


Epoch [838/5000]: 100%|██████████| 14/14 [00:00<00:00, 134.52it/s, loss=1.27]


Epoch [838/5000]: Train loss: 1.0764, Valid loss: 1.0081


Epoch [839/5000]: 100%|██████████| 14/14 [00:00<00:00, 174.04it/s, loss=0.974]


Epoch [839/5000]: Train loss: 1.0563, Valid loss: 0.9155


Epoch [840/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.76it/s, loss=1.02]


Epoch [840/5000]: Train loss: 1.0422, Valid loss: 0.9500


Epoch [841/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.34it/s, loss=1.17]


Epoch [841/5000]: Train loss: 1.0431, Valid loss: 0.9389


Epoch [842/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.60it/s, loss=0.81]


Epoch [842/5000]: Train loss: 1.0217, Valid loss: 0.9153


Epoch [843/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.70it/s, loss=0.849]


Epoch [843/5000]: Train loss: 1.0330, Valid loss: 0.9341


Epoch [844/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.48it/s, loss=1.19]


Epoch [844/5000]: Train loss: 1.0395, Valid loss: 0.9218


Epoch [845/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.27it/s, loss=1.08]


Epoch [845/5000]: Train loss: 1.0368, Valid loss: 0.9335


Epoch [846/5000]: 100%|██████████| 14/14 [00:00<00:00, 154.05it/s, loss=1.28]


Epoch [846/5000]: Train loss: 1.0447, Valid loss: 0.9191


Epoch [847/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.78it/s, loss=1]


Epoch [847/5000]: Train loss: 1.0338, Valid loss: 0.9173


Epoch [848/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.47it/s, loss=1.04]


Epoch [848/5000]: Train loss: 1.0311, Valid loss: 0.9327


Epoch [849/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.63it/s, loss=1.12]


Epoch [849/5000]: Train loss: 1.0397, Valid loss: 0.9066
Saving model with loss 0.907...


Epoch [850/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.50it/s, loss=0.986]


Epoch [850/5000]: Train loss: 1.0369, Valid loss: 0.9323


Epoch [851/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.86it/s, loss=0.811]


Epoch [851/5000]: Train loss: 1.0258, Valid loss: 0.9229


Epoch [852/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.98it/s, loss=0.927]


Epoch [852/5000]: Train loss: 1.0278, Valid loss: 0.9320


Epoch [853/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.79it/s, loss=1.1]


Epoch [853/5000]: Train loss: 1.0371, Valid loss: 0.9321


Epoch [854/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.97it/s, loss=0.968]


Epoch [854/5000]: Train loss: 1.0339, Valid loss: 0.9096


Epoch [855/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.09it/s, loss=1.05]


Epoch [855/5000]: Train loss: 1.0409, Valid loss: 0.9336


Epoch [856/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.06it/s, loss=1.02]


Epoch [856/5000]: Train loss: 1.0382, Valid loss: 0.9071


Epoch [857/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.14it/s, loss=0.886]


Epoch [857/5000]: Train loss: 1.0269, Valid loss: 0.9220


Epoch [858/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.40it/s, loss=0.947]


Epoch [858/5000]: Train loss: 1.0306, Valid loss: 0.9386


Epoch [859/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.40it/s, loss=0.999]


Epoch [859/5000]: Train loss: 1.0396, Valid loss: 0.9401


Epoch [860/5000]: 100%|██████████| 14/14 [00:00<00:00, 149.85it/s, loss=0.804]


Epoch [860/5000]: Train loss: 1.0294, Valid loss: 0.9352


Epoch [861/5000]: 100%|██████████| 14/14 [00:00<00:00, 143.84it/s, loss=0.951]


Epoch [861/5000]: Train loss: 1.0464, Valid loss: 0.9230


Epoch [862/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.80it/s, loss=0.916]


Epoch [862/5000]: Train loss: 1.0397, Valid loss: 0.9393


Epoch [863/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.42it/s, loss=0.886]


Epoch [863/5000]: Train loss: 1.0270, Valid loss: 0.9093


Epoch [864/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.04it/s, loss=0.988]


Epoch [864/5000]: Train loss: 1.0370, Valid loss: 0.9255


Epoch [865/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.39it/s, loss=0.87]


Epoch [865/5000]: Train loss: 1.0254, Valid loss: 0.9350


Epoch [866/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.60it/s, loss=0.874]


Epoch [866/5000]: Train loss: 1.0226, Valid loss: 0.9204


Epoch [867/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.47it/s, loss=1.41]


Epoch [867/5000]: Train loss: 1.0511, Valid loss: 0.9160


Epoch [868/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.33it/s, loss=1.04]


Epoch [868/5000]: Train loss: 1.0365, Valid loss: 0.9136


Epoch [869/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.88it/s, loss=1.04]


Epoch [869/5000]: Train loss: 1.0317, Valid loss: 0.9110


Epoch [870/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.19it/s, loss=0.976]


Epoch [870/5000]: Train loss: 1.0345, Valid loss: 0.9246


Epoch [871/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.76it/s, loss=1.02]


Epoch [871/5000]: Train loss: 1.0349, Valid loss: 0.9310


Epoch [872/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.79it/s, loss=1.01]


Epoch [872/5000]: Train loss: 1.0322, Valid loss: 0.9211


Epoch [873/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.03it/s, loss=1.13]


Epoch [873/5000]: Train loss: 1.0407, Valid loss: 0.9712


Epoch [874/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.93it/s, loss=1.16]


Epoch [874/5000]: Train loss: 1.0876, Valid loss: 0.9929


Epoch [875/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.47it/s, loss=0.999]


Epoch [875/5000]: Train loss: 1.0400, Valid loss: 0.9161


Epoch [876/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.39it/s, loss=1.08]


Epoch [876/5000]: Train loss: 1.0379, Valid loss: 0.9457


Epoch [877/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.48it/s, loss=1.2]


Epoch [877/5000]: Train loss: 1.0487, Valid loss: 0.9378


Epoch [878/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.37it/s, loss=0.822]


Epoch [878/5000]: Train loss: 1.0221, Valid loss: 0.9270


Epoch [879/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.65it/s, loss=1.04]


Epoch [879/5000]: Train loss: 1.0340, Valid loss: 0.9191


Epoch [880/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.90it/s, loss=1.04]


Epoch [880/5000]: Train loss: 1.0318, Valid loss: 0.9548


Epoch [881/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.92it/s, loss=0.933]


Epoch [881/5000]: Train loss: 1.0381, Valid loss: 0.9139


Epoch [882/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.86it/s, loss=0.91]


Epoch [882/5000]: Train loss: 1.0261, Valid loss: 0.9326


Epoch [883/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.40it/s, loss=0.995]


Epoch [883/5000]: Train loss: 1.0320, Valid loss: 0.9151


Epoch [884/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.76it/s, loss=1.14]


Epoch [884/5000]: Train loss: 1.0379, Valid loss: 0.9232


Epoch [885/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.94it/s, loss=0.929]


Epoch [885/5000]: Train loss: 1.0293, Valid loss: 0.9251


Epoch [886/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.46it/s, loss=1.15]


Epoch [886/5000]: Train loss: 1.0409, Valid loss: 0.9301


Epoch [887/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.77it/s, loss=0.813]


Epoch [887/5000]: Train loss: 1.0301, Valid loss: 0.9150


Epoch [888/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.35it/s, loss=1.13]


Epoch [888/5000]: Train loss: 1.0394, Valid loss: 0.9269


Epoch [889/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.96it/s, loss=0.879]


Epoch [889/5000]: Train loss: 1.0371, Valid loss: 0.9442


Epoch [890/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.11it/s, loss=1.19]


Epoch [890/5000]: Train loss: 1.0444, Valid loss: 0.9227


Epoch [891/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.60it/s, loss=1.13]


Epoch [891/5000]: Train loss: 1.0443, Valid loss: 0.9157


Epoch [892/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.79it/s, loss=1.43]


Epoch [892/5000]: Train loss: 1.0553, Valid loss: 0.9473


Epoch [893/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.62it/s, loss=0.954]


Epoch [893/5000]: Train loss: 1.0330, Valid loss: 0.9495


Epoch [894/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.60it/s, loss=0.848]


Epoch [894/5000]: Train loss: 1.0281, Valid loss: 0.9206


Epoch [895/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.56it/s, loss=1.05]


Epoch [895/5000]: Train loss: 1.0377, Valid loss: 0.9114


Epoch [896/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.38it/s, loss=1.14]


Epoch [896/5000]: Train loss: 1.0630, Valid loss: 0.9890


Epoch [897/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.93it/s, loss=1.06]


Epoch [897/5000]: Train loss: 1.0450, Valid loss: 0.9175


Epoch [898/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.50it/s, loss=1.3]


Epoch [898/5000]: Train loss: 1.0488, Valid loss: 0.9112


Epoch [899/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.04it/s, loss=0.923]


Epoch [899/5000]: Train loss: 1.0293, Valid loss: 0.9264


Epoch [900/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.32it/s, loss=1.06]


Epoch [900/5000]: Train loss: 1.0349, Valid loss: 0.9177


Epoch [901/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.46it/s, loss=0.862]


Epoch [901/5000]: Train loss: 1.0233, Valid loss: 0.9268


Epoch [902/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.68it/s, loss=0.999]


Epoch [902/5000]: Train loss: 1.0309, Valid loss: 0.9241


Epoch [903/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.76it/s, loss=1.11]


Epoch [903/5000]: Train loss: 1.0386, Valid loss: 0.9399


Epoch [904/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.92it/s, loss=0.853]


Epoch [904/5000]: Train loss: 1.0312, Valid loss: 0.9092


Epoch [905/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.95it/s, loss=1.34]


Epoch [905/5000]: Train loss: 1.0513, Valid loss: 0.9195


Epoch [906/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.94it/s, loss=1.1]


Epoch [906/5000]: Train loss: 1.0368, Valid loss: 0.9251


Epoch [907/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.14it/s, loss=0.856]


Epoch [907/5000]: Train loss: 1.0254, Valid loss: 0.9264


Epoch [908/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.44it/s, loss=0.924]


Epoch [908/5000]: Train loss: 1.0309, Valid loss: 0.9227


Epoch [909/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.01it/s, loss=0.901]


Epoch [909/5000]: Train loss: 1.0293, Valid loss: 0.9204


Epoch [910/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.70it/s, loss=0.945]


Epoch [910/5000]: Train loss: 1.0375, Valid loss: 0.9294


Epoch [911/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.57it/s, loss=1.06]


Epoch [911/5000]: Train loss: 1.0367, Valid loss: 0.9097


Epoch [912/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.80it/s, loss=1.03]


Epoch [912/5000]: Train loss: 1.0373, Valid loss: 0.9227


Epoch [913/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.41it/s, loss=1.21]


Epoch [913/5000]: Train loss: 1.0441, Valid loss: 0.9249


Epoch [914/5000]: 100%|██████████| 14/14 [00:00<00:00, 154.59it/s, loss=1.01]


Epoch [914/5000]: Train loss: 1.0356, Valid loss: 0.9450


Epoch [915/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.63it/s, loss=1.03]


Epoch [915/5000]: Train loss: 1.0438, Valid loss: 0.9278


Epoch [916/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.28it/s, loss=1.01]


Epoch [916/5000]: Train loss: 1.0317, Valid loss: 0.9037
Saving model with loss 0.904...


Epoch [917/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.70it/s, loss=1.1]


Epoch [917/5000]: Train loss: 1.0370, Valid loss: 0.9298


Epoch [918/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.23it/s, loss=0.965]


Epoch [918/5000]: Train loss: 1.0315, Valid loss: 0.9242


Epoch [919/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.28it/s, loss=0.921]


Epoch [919/5000]: Train loss: 1.0352, Valid loss: 0.9895


Epoch [920/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.79it/s, loss=1.07]


Epoch [920/5000]: Train loss: 1.0471, Valid loss: 0.9140


Epoch [921/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.12it/s, loss=0.859]


Epoch [921/5000]: Train loss: 1.0299, Valid loss: 0.9178


Epoch [922/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.58it/s, loss=1.05]


Epoch [922/5000]: Train loss: 1.0333, Valid loss: 0.9500


Epoch [923/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.64it/s, loss=1.21]


Epoch [923/5000]: Train loss: 1.0542, Valid loss: 0.9203


Epoch [924/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.92it/s, loss=1.17]


Epoch [924/5000]: Train loss: 1.0551, Valid loss: 0.9278


Epoch [925/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.65it/s, loss=1.09]


Epoch [925/5000]: Train loss: 1.0430, Valid loss: 0.9366


Epoch [926/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.42it/s, loss=1.04]


Epoch [926/5000]: Train loss: 1.0587, Valid loss: 0.9246


Epoch [927/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.17it/s, loss=1]


Epoch [927/5000]: Train loss: 1.0460, Valid loss: 0.9137


Epoch [928/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.27it/s, loss=0.99]


Epoch [928/5000]: Train loss: 1.0361, Valid loss: 0.9420


Epoch [929/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.31it/s, loss=0.94]


Epoch [929/5000]: Train loss: 1.0405, Valid loss: 0.9178


Epoch [930/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.03it/s, loss=1.12]


Epoch [930/5000]: Train loss: 1.0476, Valid loss: 0.9371


Epoch [931/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.34it/s, loss=0.912]


Epoch [931/5000]: Train loss: 1.0253, Valid loss: 0.9188


Epoch [932/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.70it/s, loss=0.858]


Epoch [932/5000]: Train loss: 1.0369, Valid loss: 0.9427


Epoch [933/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.82it/s, loss=0.998]


Epoch [933/5000]: Train loss: 1.0552, Valid loss: 0.9093


Epoch [934/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.90it/s, loss=1.08]


Epoch [934/5000]: Train loss: 1.0299, Valid loss: 0.9152


Epoch [935/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.13it/s, loss=1.18]


Epoch [935/5000]: Train loss: 1.0454, Valid loss: 0.9252


Epoch [936/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.69it/s, loss=0.954]


Epoch [936/5000]: Train loss: 1.0308, Valid loss: 0.9386


Epoch [937/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.73it/s, loss=1.02]


Epoch [937/5000]: Train loss: 1.0345, Valid loss: 0.9185


Epoch [938/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.68it/s, loss=0.965]


Epoch [938/5000]: Train loss: 1.0309, Valid loss: 0.9216


Epoch [939/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.54it/s, loss=0.967]


Epoch [939/5000]: Train loss: 1.0279, Valid loss: 0.9507


Epoch [940/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.07it/s, loss=1.1]


Epoch [940/5000]: Train loss: 1.0464, Valid loss: 0.9398


Epoch [941/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.54it/s, loss=0.76]


Epoch [941/5000]: Train loss: 1.0315, Valid loss: 0.9163


Epoch [942/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.71it/s, loss=0.997]


Epoch [942/5000]: Train loss: 1.0313, Valid loss: 0.9180


Epoch [943/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.95it/s, loss=0.942]


Epoch [943/5000]: Train loss: 1.0288, Valid loss: 0.9168


Epoch [944/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.05it/s, loss=1.23]


Epoch [944/5000]: Train loss: 1.0412, Valid loss: 0.9245


Epoch [945/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.58it/s, loss=0.943]


Epoch [945/5000]: Train loss: 1.0287, Valid loss: 0.9147


Epoch [946/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.87it/s, loss=1.21]


Epoch [946/5000]: Train loss: 1.0457, Valid loss: 0.9210


Epoch [947/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.92it/s, loss=0.918]


Epoch [947/5000]: Train loss: 1.0279, Valid loss: 0.9122


Epoch [948/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.48it/s, loss=0.976]


Epoch [948/5000]: Train loss: 1.0393, Valid loss: 0.9198


Epoch [949/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.02it/s, loss=1.12]


Epoch [949/5000]: Train loss: 1.0357, Valid loss: 0.9065


Epoch [950/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.98it/s, loss=0.945]


Epoch [950/5000]: Train loss: 1.0290, Valid loss: 0.9134


Epoch [951/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.86it/s, loss=1.02]


Epoch [951/5000]: Train loss: 1.0357, Valid loss: 0.9464


Epoch [952/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.87it/s, loss=0.947]


Epoch [952/5000]: Train loss: 1.0482, Valid loss: 0.9288


Epoch [953/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.96it/s, loss=1.04]


Epoch [953/5000]: Train loss: 1.0467, Valid loss: 0.9384


Epoch [954/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.76it/s, loss=1.1]


Epoch [954/5000]: Train loss: 1.0494, Valid loss: 0.9359


Epoch [955/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.49it/s, loss=1.05]


Epoch [955/5000]: Train loss: 1.0411, Valid loss: 0.9144


Epoch [956/5000]: 100%|██████████| 14/14 [00:00<00:00, 155.95it/s, loss=1.08]


Epoch [956/5000]: Train loss: 1.0339, Valid loss: 0.9189


Epoch [957/5000]: 100%|██████████| 14/14 [00:00<00:00, 142.84it/s, loss=0.905]


Epoch [957/5000]: Train loss: 1.0310, Valid loss: 0.9686


Epoch [958/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.84it/s, loss=1.13]


Epoch [958/5000]: Train loss: 1.0517, Valid loss: 0.9152


Epoch [959/5000]: 100%|██████████| 14/14 [00:00<00:00, 146.19it/s, loss=1.18]


Epoch [959/5000]: Train loss: 1.0436, Valid loss: 0.9186


Epoch [960/5000]: 100%|██████████| 14/14 [00:00<00:00, 154.85it/s, loss=1.04]

Epoch [960/5000]: Train loss: 1.0325, Valid loss: 0.9128







Epoch [961/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.53it/s, loss=1.04]


Epoch [961/5000]: Train loss: 1.0414, Valid loss: 0.9102


Epoch [962/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.81it/s, loss=0.959]


Epoch [962/5000]: Train loss: 1.0372, Valid loss: 0.9684


Epoch [963/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.01it/s, loss=1.11]


Epoch [963/5000]: Train loss: 1.0734, Valid loss: 0.9367


Epoch [964/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.80it/s, loss=0.851]


Epoch [964/5000]: Train loss: 1.0626, Valid loss: 0.9260


Epoch [965/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.82it/s, loss=1.15]


Epoch [965/5000]: Train loss: 1.0531, Valid loss: 0.9277


Epoch [966/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.50it/s, loss=0.944]


Epoch [966/5000]: Train loss: 1.0347, Valid loss: 0.9180


Epoch [967/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.15it/s, loss=1.03]


Epoch [967/5000]: Train loss: 1.0351, Valid loss: 0.9146


Epoch [968/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.69it/s, loss=1.18]


Epoch [968/5000]: Train loss: 1.0431, Valid loss: 0.9122


Epoch [969/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.56it/s, loss=1.02]


Epoch [969/5000]: Train loss: 1.0458, Valid loss: 0.9481


Epoch [970/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.61it/s, loss=1.08]


Epoch [970/5000]: Train loss: 1.0434, Valid loss: 0.9331


Epoch [971/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.56it/s, loss=1.23]


Epoch [971/5000]: Train loss: 1.0449, Valid loss: 0.9097


Epoch [972/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.29it/s, loss=0.967]


Epoch [972/5000]: Train loss: 1.0333, Valid loss: 0.9297


Epoch [973/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.70it/s, loss=1.15]


Epoch [973/5000]: Train loss: 1.0452, Valid loss: 0.9334


Epoch [974/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.36it/s, loss=0.936]


Epoch [974/5000]: Train loss: 1.0440, Valid loss: 0.9192


Epoch [975/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.21it/s, loss=0.925]


Epoch [975/5000]: Train loss: 1.0332, Valid loss: 0.9076


Epoch [976/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.43it/s, loss=1.05]


Epoch [976/5000]: Train loss: 1.0369, Valid loss: 0.9399


Epoch [977/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.73it/s, loss=0.812]


Epoch [977/5000]: Train loss: 1.0333, Valid loss: 0.9331


Epoch [978/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.41it/s, loss=0.905]


Epoch [978/5000]: Train loss: 1.0403, Valid loss: 0.9222


Epoch [979/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.36it/s, loss=0.981]


Epoch [979/5000]: Train loss: 1.0332, Valid loss: 0.9463


Epoch [980/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.10it/s, loss=1.02]


Epoch [980/5000]: Train loss: 1.0325, Valid loss: 0.9315


Epoch [981/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.15it/s, loss=1.22]


Epoch [981/5000]: Train loss: 1.0422, Valid loss: 0.9248


Epoch [982/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.70it/s, loss=1.19]


Epoch [982/5000]: Train loss: 1.0431, Valid loss: 0.9360


Epoch [983/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.27it/s, loss=1.06]


Epoch [983/5000]: Train loss: 1.0322, Valid loss: 0.9169


Epoch [984/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.88it/s, loss=0.969]


Epoch [984/5000]: Train loss: 1.0264, Valid loss: 0.9113


Epoch [985/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.23it/s, loss=1.42]


Epoch [985/5000]: Train loss: 1.0500, Valid loss: 0.9301


Epoch [986/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.36it/s, loss=0.892]


Epoch [986/5000]: Train loss: 1.0358, Valid loss: 0.9468


Epoch [987/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.90it/s, loss=0.968]


Epoch [987/5000]: Train loss: 1.0392, Valid loss: 0.9171


Epoch [988/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.25it/s, loss=0.997]


Epoch [988/5000]: Train loss: 1.0359, Valid loss: 0.9201


Epoch [989/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.19it/s, loss=1.01]


Epoch [989/5000]: Train loss: 1.0337, Valid loss: 0.9487


Epoch [990/5000]: 100%|██████████| 14/14 [00:00<00:00, 110.44it/s, loss=1.05] 


Epoch [990/5000]: Train loss: 1.0612, Valid loss: 0.9645


Epoch [991/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.75it/s, loss=0.845]


Epoch [991/5000]: Train loss: 1.0268, Valid loss: 0.9076


Epoch [992/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.29it/s, loss=0.936]


Epoch [992/5000]: Train loss: 1.0255, Valid loss: 0.9634


Epoch [993/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.23it/s, loss=0.937]


Epoch [993/5000]: Train loss: 1.0256, Valid loss: 0.9076


Epoch [994/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.97it/s, loss=1.03]


Epoch [994/5000]: Train loss: 1.0345, Valid loss: 0.9159


Epoch [995/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.05it/s, loss=0.999]


Epoch [995/5000]: Train loss: 1.0321, Valid loss: 0.9375


Epoch [996/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.68it/s, loss=1]


Epoch [996/5000]: Train loss: 1.0302, Valid loss: 0.9067


Epoch [997/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.30it/s, loss=0.964]


Epoch [997/5000]: Train loss: 1.0487, Valid loss: 0.9248


Epoch [998/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.84it/s, loss=0.762]


Epoch [998/5000]: Train loss: 1.0176, Valid loss: 0.9123


Epoch [999/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.55it/s, loss=0.894]


Epoch [999/5000]: Train loss: 1.0229, Valid loss: 0.9244


Epoch [1000/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.53it/s, loss=0.9]


Epoch [1000/5000]: Train loss: 1.0257, Valid loss: 0.9292


Epoch [1001/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.61it/s, loss=0.994]


Epoch [1001/5000]: Train loss: 1.0322, Valid loss: 0.9313


Epoch [1002/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.26it/s, loss=0.926]


Epoch [1002/5000]: Train loss: 1.0275, Valid loss: 0.9488


Epoch [1003/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.29it/s, loss=0.946]


Epoch [1003/5000]: Train loss: 1.0257, Valid loss: 0.9540


Epoch [1004/5000]: 100%|██████████| 14/14 [00:00<00:00, 164.25it/s, loss=0.804]


Epoch [1004/5000]: Train loss: 1.0277, Valid loss: 0.9151


Epoch [1005/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.52it/s, loss=1.06]


Epoch [1005/5000]: Train loss: 1.0349, Valid loss: 0.9153


Epoch [1006/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.24it/s, loss=1.15]


Epoch [1006/5000]: Train loss: 1.0385, Valid loss: 0.9073


Epoch [1007/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.22it/s, loss=0.961]


Epoch [1007/5000]: Train loss: 1.0352, Valid loss: 0.9292


Epoch [1008/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.98it/s, loss=0.986]


Epoch [1008/5000]: Train loss: 1.0326, Valid loss: 0.9151


Epoch [1009/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.65it/s, loss=0.928]


Epoch [1009/5000]: Train loss: 1.0298, Valid loss: 0.9085


Epoch [1010/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.96it/s, loss=0.882]


Epoch [1010/5000]: Train loss: 1.0223, Valid loss: 0.9291


Epoch [1011/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.23it/s, loss=1.12]


Epoch [1011/5000]: Train loss: 1.0367, Valid loss: 0.9081


Epoch [1012/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.65it/s, loss=1.12]


Epoch [1012/5000]: Train loss: 1.0360, Valid loss: 0.9138


Epoch [1013/5000]: 100%|██████████| 14/14 [00:00<00:00, 216.60it/s, loss=0.992]


Epoch [1013/5000]: Train loss: 1.0302, Valid loss: 0.9500


Epoch [1014/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.97it/s, loss=1.12]


Epoch [1014/5000]: Train loss: 1.0382, Valid loss: 0.9195


Epoch [1015/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.11it/s, loss=1.26]


Epoch [1015/5000]: Train loss: 1.0603, Valid loss: 0.9297


Epoch [1016/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.87it/s, loss=0.853]


Epoch [1016/5000]: Train loss: 1.0341, Valid loss: 0.9293


Epoch [1017/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.85it/s, loss=0.922]


Epoch [1017/5000]: Train loss: 1.0354, Valid loss: 0.9170


Epoch [1018/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.94it/s, loss=1.08]


Epoch [1018/5000]: Train loss: 1.0504, Valid loss: 0.9511


Epoch [1019/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.96it/s, loss=0.901]


Epoch [1019/5000]: Train loss: 1.0566, Valid loss: 0.9371


Epoch [1020/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.25it/s, loss=1.11]


Epoch [1020/5000]: Train loss: 1.0489, Valid loss: 0.9545


Epoch [1021/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.16it/s, loss=1.29]


Epoch [1021/5000]: Train loss: 1.0546, Valid loss: 0.9390


Epoch [1022/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.60it/s, loss=0.823]


Epoch [1022/5000]: Train loss: 1.0304, Valid loss: 0.9047


Epoch [1023/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.28it/s, loss=1.13]


Epoch [1023/5000]: Train loss: 1.0440, Valid loss: 0.9320


Epoch [1024/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.70it/s, loss=1.2]


Epoch [1024/5000]: Train loss: 1.0434, Valid loss: 0.9207


Epoch [1025/5000]: 100%|██████████| 14/14 [00:00<00:00, 167.06it/s, loss=1.1]


Epoch [1025/5000]: Train loss: 1.0472, Valid loss: 0.9169


Epoch [1026/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.67it/s, loss=0.979]


Epoch [1026/5000]: Train loss: 1.0356, Valid loss: 0.9363


Epoch [1027/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.15it/s, loss=1.14]


Epoch [1027/5000]: Train loss: 1.0352, Valid loss: 0.9183


Epoch [1028/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.38it/s, loss=0.951]


Epoch [1028/5000]: Train loss: 1.0282, Valid loss: 0.9232


Epoch [1029/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.84it/s, loss=0.798]


Epoch [1029/5000]: Train loss: 1.0233, Valid loss: 0.9227


Epoch [1030/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.81it/s, loss=1.15]


Epoch [1030/5000]: Train loss: 1.0381, Valid loss: 0.9689


Epoch [1031/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.11it/s, loss=0.911]


Epoch [1031/5000]: Train loss: 1.0363, Valid loss: 0.9049


Epoch [1032/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.68it/s, loss=1.06]


Epoch [1032/5000]: Train loss: 1.0384, Valid loss: 0.9144


Epoch [1033/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.89it/s, loss=1.37]


Epoch [1033/5000]: Train loss: 1.0471, Valid loss: 0.9635


Epoch [1034/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.57it/s, loss=0.965]


Epoch [1034/5000]: Train loss: 1.0312, Valid loss: 0.9344


Epoch [1035/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.61it/s, loss=1.02]


Epoch [1035/5000]: Train loss: 1.0489, Valid loss: 0.9211


Epoch [1036/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.99it/s, loss=0.938]


Epoch [1036/5000]: Train loss: 1.0404, Valid loss: 0.9155


Epoch [1037/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.55it/s, loss=0.996]


Epoch [1037/5000]: Train loss: 1.0371, Valid loss: 0.9066


Epoch [1038/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.28it/s, loss=1.17]


Epoch [1038/5000]: Train loss: 1.0448, Valid loss: 0.9406


Epoch [1039/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.94it/s, loss=1.09]


Epoch [1039/5000]: Train loss: 1.0472, Valid loss: 0.9146


Epoch [1040/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.16it/s, loss=1.14]


Epoch [1040/5000]: Train loss: 1.0469, Valid loss: 0.9194


Epoch [1041/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.89it/s, loss=1.17]


Epoch [1041/5000]: Train loss: 1.0382, Valid loss: 0.9067


Epoch [1042/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.05it/s, loss=1.2]


Epoch [1042/5000]: Train loss: 1.0428, Valid loss: 0.9097


Epoch [1043/5000]: 100%|██████████| 14/14 [00:00<00:00, 144.96it/s, loss=1.01]


Epoch [1043/5000]: Train loss: 1.0311, Valid loss: 0.9153


Epoch [1044/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.92it/s, loss=1.16]


Epoch [1044/5000]: Train loss: 1.0364, Valid loss: 0.9239


Epoch [1045/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.23it/s, loss=1.04]


Epoch [1045/5000]: Train loss: 1.0318, Valid loss: 0.9188


Epoch [1046/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.62it/s, loss=0.916]


Epoch [1046/5000]: Train loss: 1.0222, Valid loss: 0.9283


Epoch [1047/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.64it/s, loss=0.822]


Epoch [1047/5000]: Train loss: 1.0262, Valid loss: 0.9103


Epoch [1048/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.88it/s, loss=1.02]


Epoch [1048/5000]: Train loss: 1.0352, Valid loss: 0.9158


Epoch [1049/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.22it/s, loss=1.05]


Epoch [1049/5000]: Train loss: 1.0364, Valid loss: 0.9215


Epoch [1050/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.76it/s, loss=0.926]


Epoch [1050/5000]: Train loss: 1.0236, Valid loss: 0.9162


Epoch [1051/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.53it/s, loss=1.15]


Epoch [1051/5000]: Train loss: 1.0425, Valid loss: 0.9109


Epoch [1052/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.79it/s, loss=1.04]


Epoch [1052/5000]: Train loss: 1.0297, Valid loss: 0.9165


Epoch [1053/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.58it/s, loss=1.24]


Epoch [1053/5000]: Train loss: 1.0417, Valid loss: 0.9259


Epoch [1054/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.49it/s, loss=1.3]


Epoch [1054/5000]: Train loss: 1.0417, Valid loss: 0.9093


Epoch [1055/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.01it/s, loss=0.883]


Epoch [1055/5000]: Train loss: 1.0255, Valid loss: 0.9222


Epoch [1056/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.55it/s, loss=1.13]


Epoch [1056/5000]: Train loss: 1.0400, Valid loss: 0.9147


Epoch [1057/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.34it/s, loss=1.33]


Epoch [1057/5000]: Train loss: 1.0467, Valid loss: 0.9301


Epoch [1058/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.63it/s, loss=1.03]


Epoch [1058/5000]: Train loss: 1.0317, Valid loss: 0.9205


Epoch [1059/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.49it/s, loss=1.08]


Epoch [1059/5000]: Train loss: 1.0314, Valid loss: 0.9124


Epoch [1060/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.71it/s, loss=1.05]


Epoch [1060/5000]: Train loss: 1.0317, Valid loss: 0.9233


Epoch [1061/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.10it/s, loss=0.931]


Epoch [1061/5000]: Train loss: 1.0273, Valid loss: 0.9118


Epoch [1062/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.28it/s, loss=1.05]


Epoch [1062/5000]: Train loss: 1.0349, Valid loss: 0.9147


Epoch [1063/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.32it/s, loss=0.935]


Epoch [1063/5000]: Train loss: 1.0308, Valid loss: 0.9182


Epoch [1064/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.59it/s, loss=0.806]


Epoch [1064/5000]: Train loss: 1.0223, Valid loss: 0.9201


Epoch [1065/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.77it/s, loss=1.39]


Epoch [1065/5000]: Train loss: 1.0450, Valid loss: 0.9181


Epoch [1066/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.83it/s, loss=1.02]


Epoch [1066/5000]: Train loss: 1.0316, Valid loss: 0.9057


Epoch [1067/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.41it/s, loss=1.13]


Epoch [1067/5000]: Train loss: 1.0379, Valid loss: 0.9892


Epoch [1068/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.83it/s, loss=1.03]


Epoch [1068/5000]: Train loss: 1.0439, Valid loss: 0.9286


Epoch [1069/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.52it/s, loss=0.9]


Epoch [1069/5000]: Train loss: 1.0226, Valid loss: 0.9230


Epoch [1070/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.96it/s, loss=1.01]


Epoch [1070/5000]: Train loss: 1.0312, Valid loss: 0.9331


Epoch [1071/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.15it/s, loss=1.02]


Epoch [1071/5000]: Train loss: 1.0359, Valid loss: 0.9056


Epoch [1072/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.59it/s, loss=1.07]


Epoch [1072/5000]: Train loss: 1.0432, Valid loss: 0.9305


Epoch [1073/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.11it/s, loss=0.951]


Epoch [1073/5000]: Train loss: 1.0307, Valid loss: 0.9169


Epoch [1074/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.74it/s, loss=1.13]


Epoch [1074/5000]: Train loss: 1.0357, Valid loss: 0.9224


Epoch [1075/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.29it/s, loss=1]


Epoch [1075/5000]: Train loss: 1.0388, Valid loss: 0.9277


Epoch [1076/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.51it/s, loss=1.3]


Epoch [1076/5000]: Train loss: 1.0461, Valid loss: 0.9111


Epoch [1077/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.67it/s, loss=1.02]


Epoch [1077/5000]: Train loss: 1.0323, Valid loss: 0.9481


Epoch [1078/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.40it/s, loss=1.13]


Epoch [1078/5000]: Train loss: 1.0549, Valid loss: 0.9536


Epoch [1079/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.04it/s, loss=1.38]


Epoch [1079/5000]: Train loss: 1.0459, Valid loss: 0.9268


Epoch [1080/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.42it/s, loss=1.16]


Epoch [1080/5000]: Train loss: 1.0353, Valid loss: 0.9266


Epoch [1081/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.43it/s, loss=0.861]


Epoch [1081/5000]: Train loss: 1.0204, Valid loss: 0.9103


Epoch [1082/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.66it/s, loss=0.998]


Epoch [1082/5000]: Train loss: 1.0394, Valid loss: 0.9162


Epoch [1083/5000]: 100%|██████████| 14/14 [00:00<00:00, 223.46it/s, loss=1.08]


Epoch [1083/5000]: Train loss: 1.0337, Valid loss: 0.9630


Epoch [1084/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.28it/s, loss=0.934]


Epoch [1084/5000]: Train loss: 1.0419, Valid loss: 0.9534


Epoch [1085/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.07it/s, loss=1.34]


Epoch [1085/5000]: Train loss: 1.0579, Valid loss: 0.9197


Epoch [1086/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.35it/s, loss=0.892]


Epoch [1086/5000]: Train loss: 1.0417, Valid loss: 0.9165


Epoch [1087/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.95it/s, loss=0.882]


Epoch [1087/5000]: Train loss: 1.0258, Valid loss: 0.9163


Epoch [1088/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.81it/s, loss=0.849]


Epoch [1088/5000]: Train loss: 1.0252, Valid loss: 0.9204


Epoch [1089/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.54it/s, loss=1.18]


Epoch [1089/5000]: Train loss: 1.0398, Valid loss: 0.9072


Epoch [1090/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.43it/s, loss=1.29]


Epoch [1090/5000]: Train loss: 1.0480, Valid loss: 0.9240


Epoch [1091/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.57it/s, loss=0.886]


Epoch [1091/5000]: Train loss: 1.0397, Valid loss: 0.9177


Epoch [1092/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.93it/s, loss=0.733]


Epoch [1092/5000]: Train loss: 1.0194, Valid loss: 0.9195


Epoch [1093/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.49it/s, loss=1.1]


Epoch [1093/5000]: Train loss: 1.0359, Valid loss: 0.9119


Epoch [1094/5000]: 100%|██████████| 14/14 [00:00<00:00, 157.01it/s, loss=0.897]


Epoch [1094/5000]: Train loss: 1.0308, Valid loss: 0.9489


Epoch [1095/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.58it/s, loss=1.11]


Epoch [1095/5000]: Train loss: 1.0441, Valid loss: 0.9157


Epoch [1096/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.90it/s, loss=0.967]


Epoch [1096/5000]: Train loss: 1.0299, Valid loss: 0.9239


Epoch [1097/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.97it/s, loss=0.966]


Epoch [1097/5000]: Train loss: 1.0319, Valid loss: 0.9718


Epoch [1098/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.19it/s, loss=1.03]


Epoch [1098/5000]: Train loss: 1.0400, Valid loss: 0.9118


Epoch [1099/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.46it/s, loss=0.876]


Epoch [1099/5000]: Train loss: 1.0265, Valid loss: 0.9301


Epoch [1100/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.90it/s, loss=1.22]


Epoch [1100/5000]: Train loss: 1.0409, Valid loss: 0.9440


Epoch [1101/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.30it/s, loss=0.798]


Epoch [1101/5000]: Train loss: 1.0265, Valid loss: 0.9163


Epoch [1102/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.50it/s, loss=1.22]


Epoch [1102/5000]: Train loss: 1.0446, Valid loss: 0.9144


Epoch [1103/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.35it/s, loss=1.13]


Epoch [1103/5000]: Train loss: 1.0365, Valid loss: 0.9233


Epoch [1104/5000]: 100%|██████████| 14/14 [00:00<00:00, 177.35it/s, loss=0.87]


Epoch [1104/5000]: Train loss: 1.0250, Valid loss: 0.9129


Epoch [1105/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.31it/s, loss=1.3]


Epoch [1105/5000]: Train loss: 1.0465, Valid loss: 0.9297


Epoch [1106/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.04it/s, loss=0.96]


Epoch [1106/5000]: Train loss: 1.0258, Valid loss: 0.9316


Epoch [1107/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.76it/s, loss=1.22]


Epoch [1107/5000]: Train loss: 1.0436, Valid loss: 0.9448


Epoch [1108/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.70it/s, loss=0.952]


Epoch [1108/5000]: Train loss: 1.0368, Valid loss: 0.9068


Epoch [1109/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.58it/s, loss=0.947]


Epoch [1109/5000]: Train loss: 1.0345, Valid loss: 0.9589


Epoch [1110/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.67it/s, loss=1.03]


Epoch [1110/5000]: Train loss: 1.0324, Valid loss: 0.9502


Epoch [1111/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.92it/s, loss=1.22]


Epoch [1111/5000]: Train loss: 1.0405, Valid loss: 0.9509


Epoch [1112/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.08it/s, loss=0.899]


Epoch [1112/5000]: Train loss: 1.0309, Valid loss: 0.9257


Epoch [1113/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.54it/s, loss=0.93]


Epoch [1113/5000]: Train loss: 1.0323, Valid loss: 0.9103


Epoch [1114/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.99it/s, loss=1.44]


Epoch [1114/5000]: Train loss: 1.0457, Valid loss: 0.9302


Epoch [1115/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.45it/s, loss=1.05]


Epoch [1115/5000]: Train loss: 1.0341, Valid loss: 0.9187


Epoch [1116/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.83it/s, loss=1.01]


Epoch [1116/5000]: Train loss: 1.0289, Valid loss: 0.9110


Epoch [1117/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.03it/s, loss=0.971]


Epoch [1117/5000]: Train loss: 1.0269, Valid loss: 0.9266


Epoch [1118/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.65it/s, loss=1.14]


Epoch [1118/5000]: Train loss: 1.0334, Valid loss: 0.9182


Epoch [1119/5000]: 100%|██████████| 14/14 [00:00<00:00, 142.34it/s, loss=1.04]


Epoch [1119/5000]: Train loss: 1.0320, Valid loss: 0.9126


Epoch [1120/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.57it/s, loss=0.934]


Epoch [1120/5000]: Train loss: 1.0299, Valid loss: 0.9101


Epoch [1121/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.16it/s, loss=1.06]


Epoch [1121/5000]: Train loss: 1.0405, Valid loss: 0.9281


Epoch [1122/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.49it/s, loss=1.22]


Epoch [1122/5000]: Train loss: 1.0397, Valid loss: 0.9364


Epoch [1123/5000]: 100%|██████████| 14/14 [00:00<00:00, 162.07it/s, loss=0.863]


Epoch [1123/5000]: Train loss: 1.0257, Valid loss: 1.0071


Epoch [1124/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.16it/s, loss=0.92]


Epoch [1124/5000]: Train loss: 1.0362, Valid loss: 0.9077


Epoch [1125/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.71it/s, loss=1.1]


Epoch [1125/5000]: Train loss: 1.0466, Valid loss: 0.9445


Epoch [1126/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.32it/s, loss=1.18]


Epoch [1126/5000]: Train loss: 1.0437, Valid loss: 0.9336


Epoch [1127/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.32it/s, loss=0.976]


Epoch [1127/5000]: Train loss: 1.0318, Valid loss: 0.9231


Epoch [1128/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.82it/s, loss=0.882]


Epoch [1128/5000]: Train loss: 1.0258, Valid loss: 0.9152


Epoch [1129/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.17it/s, loss=0.962]


Epoch [1129/5000]: Train loss: 1.0315, Valid loss: 0.9228


Epoch [1130/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.10it/s, loss=0.983]


Epoch [1130/5000]: Train loss: 1.0317, Valid loss: 0.9198


Epoch [1131/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.74it/s, loss=0.962]


Epoch [1131/5000]: Train loss: 1.0282, Valid loss: 0.9229


Epoch [1132/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.90it/s, loss=1.01]


Epoch [1132/5000]: Train loss: 1.0302, Valid loss: 0.9205


Epoch [1133/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.98it/s, loss=1.05]


Epoch [1133/5000]: Train loss: 1.0297, Valid loss: 0.9128


Epoch [1134/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.56it/s, loss=1.08]


Epoch [1134/5000]: Train loss: 1.0348, Valid loss: 0.9195


Epoch [1135/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.60it/s, loss=0.983]


Epoch [1135/5000]: Train loss: 1.0272, Valid loss: 0.9267


Epoch [1136/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.72it/s, loss=1.2]


Epoch [1136/5000]: Train loss: 1.0383, Valid loss: 0.9127


Epoch [1137/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.91it/s, loss=1.04]


Epoch [1137/5000]: Train loss: 1.0656, Valid loss: 0.9375


Epoch [1138/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.97it/s, loss=1.03]


Epoch [1138/5000]: Train loss: 1.0332, Valid loss: 0.9152


Epoch [1139/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.02it/s, loss=1.02]


Epoch [1139/5000]: Train loss: 1.0305, Valid loss: 0.9094


Epoch [1140/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.06it/s, loss=0.912]


Epoch [1140/5000]: Train loss: 1.0483, Valid loss: 1.0090


Epoch [1141/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.79it/s, loss=1]


Epoch [1141/5000]: Train loss: 1.0510, Valid loss: 0.9279


Epoch [1142/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.98it/s, loss=1.09]


Epoch [1142/5000]: Train loss: 1.0395, Valid loss: 0.9126


Epoch [1143/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.17it/s, loss=1.07]


Epoch [1143/5000]: Train loss: 1.0333, Valid loss: 0.9175


Epoch [1144/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.94it/s, loss=0.91]


Epoch [1144/5000]: Train loss: 1.0248, Valid loss: 0.9425


Epoch [1145/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.23it/s, loss=0.945]


Epoch [1145/5000]: Train loss: 1.0260, Valid loss: 0.9422


Epoch [1146/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.49it/s, loss=0.956]


Epoch [1146/5000]: Train loss: 1.0303, Valid loss: 0.9077


Epoch [1147/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.78it/s, loss=1.06]


Epoch [1147/5000]: Train loss: 1.0332, Valid loss: 0.9060


Epoch [1148/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.71it/s, loss=1.02]


Epoch [1148/5000]: Train loss: 1.0448, Valid loss: 0.9158


Epoch [1149/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.05it/s, loss=1.06]


Epoch [1149/5000]: Train loss: 1.0527, Valid loss: 0.9619


Epoch [1150/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.62it/s, loss=1.2]


Epoch [1150/5000]: Train loss: 1.0519, Valid loss: 0.9272


Epoch [1151/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.44it/s, loss=1.04]


Epoch [1151/5000]: Train loss: 1.0392, Valid loss: 0.9218


Epoch [1152/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.12it/s, loss=0.944]


Epoch [1152/5000]: Train loss: 1.0270, Valid loss: 0.9237


Epoch [1153/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.49it/s, loss=1.16]


Epoch [1153/5000]: Train loss: 1.0361, Valid loss: 0.9277


Epoch [1154/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.87it/s, loss=0.888]


Epoch [1154/5000]: Train loss: 1.0251, Valid loss: 0.9120


Epoch [1155/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.65it/s, loss=1.41]


Epoch [1155/5000]: Train loss: 1.0454, Valid loss: 0.9141


Epoch [1156/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.66it/s, loss=1.08]


Epoch [1156/5000]: Train loss: 1.0360, Valid loss: 0.9474


Epoch [1157/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.97it/s, loss=1.03]


Epoch [1157/5000]: Train loss: 1.0403, Valid loss: 0.9348


Epoch [1158/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.78it/s, loss=1]


Epoch [1158/5000]: Train loss: 1.0316, Valid loss: 0.9220


Epoch [1159/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.43it/s, loss=1.02]


Epoch [1159/5000]: Train loss: 1.0307, Valid loss: 0.9261


Epoch [1160/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.37it/s, loss=1.03]


Epoch [1160/5000]: Train loss: 1.0368, Valid loss: 0.9661


Epoch [1161/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.32it/s, loss=1.01]


Epoch [1161/5000]: Train loss: 1.0317, Valid loss: 0.9295


Epoch [1162/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.63it/s, loss=0.952]


Epoch [1162/5000]: Train loss: 1.0278, Valid loss: 0.9133


Epoch [1163/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.77it/s, loss=0.846]


Epoch [1163/5000]: Train loss: 1.0215, Valid loss: 0.9842


Epoch [1164/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.30it/s, loss=0.967]


Epoch [1164/5000]: Train loss: 1.0308, Valid loss: 0.9094


Epoch [1165/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.23it/s, loss=1.05]


Epoch [1165/5000]: Train loss: 1.0298, Valid loss: 0.9163


Epoch [1166/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.76it/s, loss=1.08]


Epoch [1166/5000]: Train loss: 1.0507, Valid loss: 0.9548


Epoch [1167/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.01it/s, loss=1.08]


Epoch [1167/5000]: Train loss: 1.0374, Valid loss: 0.9138


Epoch [1168/5000]: 100%|██████████| 14/14 [00:00<00:00, 173.95it/s, loss=1.07]


Epoch [1168/5000]: Train loss: 1.0370, Valid loss: 0.9281


Epoch [1169/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.89it/s, loss=1.1]


Epoch [1169/5000]: Train loss: 1.0334, Valid loss: 0.9260


Epoch [1170/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.33it/s, loss=1.17]


Epoch [1170/5000]: Train loss: 1.0352, Valid loss: 0.9181


Epoch [1171/5000]: 100%|██████████| 14/14 [00:00<00:00, 163.18it/s, loss=0.853]


Epoch [1171/5000]: Train loss: 1.0324, Valid loss: 0.9275


Epoch [1172/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.52it/s, loss=0.946]


Epoch [1172/5000]: Train loss: 1.0282, Valid loss: 0.9390


Epoch [1173/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.84it/s, loss=0.921]


Epoch [1173/5000]: Train loss: 1.0264, Valid loss: 0.9426


Epoch [1174/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.15it/s, loss=1.16]


Epoch [1174/5000]: Train loss: 1.0406, Valid loss: 0.9108


Epoch [1175/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.17it/s, loss=1.15]


Epoch [1175/5000]: Train loss: 1.0363, Valid loss: 0.9048


Epoch [1176/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.89it/s, loss=1.08]


Epoch [1176/5000]: Train loss: 1.0307, Valid loss: 0.9250


Epoch [1177/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.70it/s, loss=0.83]


Epoch [1177/5000]: Train loss: 1.0262, Valid loss: 0.9207


Epoch [1178/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.08it/s, loss=0.99]


Epoch [1178/5000]: Train loss: 1.0256, Valid loss: 0.9414


Epoch [1179/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.50it/s, loss=0.963]


Epoch [1179/5000]: Train loss: 1.0350, Valid loss: 0.9297


Epoch [1180/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.38it/s, loss=0.827]


Epoch [1180/5000]: Train loss: 1.0336, Valid loss: 0.9141


Epoch [1181/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.10it/s, loss=1.05]


Epoch [1181/5000]: Train loss: 1.0442, Valid loss: 0.9234


Epoch [1182/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.07it/s, loss=1.48]


Epoch [1182/5000]: Train loss: 1.0506, Valid loss: 0.9549


Epoch [1183/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.78it/s, loss=1.01]


Epoch [1183/5000]: Train loss: 1.0273, Valid loss: 0.9163


Epoch [1184/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.71it/s, loss=0.917]


Epoch [1184/5000]: Train loss: 1.0241, Valid loss: 0.9203


Epoch [1185/5000]: 100%|██████████| 14/14 [00:00<00:00, 159.73it/s, loss=0.786]


Epoch [1185/5000]: Train loss: 1.0164, Valid loss: 0.9204


Epoch [1186/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.18it/s, loss=0.943]


Epoch [1186/5000]: Train loss: 1.0258, Valid loss: 0.9122


Epoch [1187/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.27it/s, loss=1.01]


Epoch [1187/5000]: Train loss: 1.0285, Valid loss: 0.9246


Epoch [1188/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.65it/s, loss=1.2]


Epoch [1188/5000]: Train loss: 1.0335, Valid loss: 0.9246


Epoch [1189/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.24it/s, loss=0.81]


Epoch [1189/5000]: Train loss: 1.0171, Valid loss: 0.9135


Epoch [1190/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.90it/s, loss=0.878]


Epoch [1190/5000]: Train loss: 1.0335, Valid loss: 0.9884


Epoch [1191/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.52it/s, loss=1.35]


Epoch [1191/5000]: Train loss: 1.0609, Valid loss: 0.9136


Epoch [1192/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.18it/s, loss=1.18]


Epoch [1192/5000]: Train loss: 1.0373, Valid loss: 0.9511


Epoch [1193/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.19it/s, loss=1.1]


Epoch [1193/5000]: Train loss: 1.0323, Valid loss: 0.9373


Epoch [1194/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.13it/s, loss=1.05]


Epoch [1194/5000]: Train loss: 1.0351, Valid loss: 0.9268


Epoch [1195/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.30it/s, loss=1.06]


Epoch [1195/5000]: Train loss: 1.0339, Valid loss: 0.9121


Epoch [1196/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.30it/s, loss=1.38]


Epoch [1196/5000]: Train loss: 1.0518, Valid loss: 0.9105


Epoch [1197/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.49it/s, loss=0.955]


Epoch [1197/5000]: Train loss: 1.0370, Valid loss: 0.9209


Epoch [1198/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.05it/s, loss=1.03]


Epoch [1198/5000]: Train loss: 1.0357, Valid loss: 0.9156


Epoch [1199/5000]: 100%|██████████| 14/14 [00:00<00:00, 183.78it/s, loss=0.929]


Epoch [1199/5000]: Train loss: 1.0252, Valid loss: 0.9300


Epoch [1200/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.98it/s, loss=1.07]


Epoch [1200/5000]: Train loss: 1.0325, Valid loss: 0.9138


Epoch [1201/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.68it/s, loss=0.948]


Epoch [1201/5000]: Train loss: 1.0238, Valid loss: 0.9045


Epoch [1202/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.58it/s, loss=0.881]


Epoch [1202/5000]: Train loss: 1.0213, Valid loss: 0.9194


Epoch [1203/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.66it/s, loss=0.955]


Epoch [1203/5000]: Train loss: 1.0272, Valid loss: 0.9339


Epoch [1204/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.61it/s, loss=0.928]


Epoch [1204/5000]: Train loss: 1.0210, Valid loss: 0.9129


Epoch [1205/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.02it/s, loss=1.06]


Epoch [1205/5000]: Train loss: 1.0289, Valid loss: 0.9061


Epoch [1206/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.48it/s, loss=1]


Epoch [1206/5000]: Train loss: 1.0323, Valid loss: 0.9324


Epoch [1207/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.08it/s, loss=0.917]


Epoch [1207/5000]: Train loss: 1.0222, Valid loss: 0.9240


Epoch [1208/5000]: 100%|██████████| 14/14 [00:00<00:00, 151.76it/s, loss=1.03]


Epoch [1208/5000]: Train loss: 1.0362, Valid loss: 0.9101


Epoch [1209/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.80it/s, loss=1.21]


Epoch [1209/5000]: Train loss: 1.0385, Valid loss: 0.9112


Epoch [1210/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.62it/s, loss=1.22]


Epoch [1210/5000]: Train loss: 1.0493, Valid loss: 0.9334


Epoch [1211/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.37it/s, loss=0.939]


Epoch [1211/5000]: Train loss: 1.0291, Valid loss: 0.9132


Epoch [1212/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.12it/s, loss=0.885]


Epoch [1212/5000]: Train loss: 1.0271, Valid loss: 0.9449


Epoch [1213/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.12it/s, loss=0.949]


Epoch [1213/5000]: Train loss: 1.0314, Valid loss: 0.9102


Epoch [1214/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.14it/s, loss=1.04]


Epoch [1214/5000]: Train loss: 1.0364, Valid loss: 0.9690


Epoch [1215/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.50it/s, loss=0.946]


Epoch [1215/5000]: Train loss: 1.0351, Valid loss: 0.9153


Epoch [1216/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.76it/s, loss=0.833]


Epoch [1216/5000]: Train loss: 1.0218, Valid loss: 0.9127


Epoch [1217/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.71it/s, loss=1.14]


Epoch [1217/5000]: Train loss: 1.0335, Valid loss: 0.9334


Epoch [1218/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.28it/s, loss=1.15]


Epoch [1218/5000]: Train loss: 1.0378, Valid loss: 0.9145


Epoch [1219/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.36it/s, loss=1.09]


Epoch [1219/5000]: Train loss: 1.0328, Valid loss: 0.9168


Epoch [1220/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.14it/s, loss=0.834]


Epoch [1220/5000]: Train loss: 1.0200, Valid loss: 0.9398


Epoch [1221/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.61it/s, loss=1]


Epoch [1221/5000]: Train loss: 1.0286, Valid loss: 0.9068


Epoch [1222/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.17it/s, loss=1.01]


Epoch [1222/5000]: Train loss: 1.0311, Valid loss: 0.9204


Epoch [1223/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.87it/s, loss=1.05]


Epoch [1223/5000]: Train loss: 1.0401, Valid loss: 0.9187


Epoch [1224/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.67it/s, loss=0.946]


Epoch [1224/5000]: Train loss: 1.0256, Valid loss: 0.9188


Epoch [1225/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.43it/s, loss=0.864]


Epoch [1225/5000]: Train loss: 1.0227, Valid loss: 0.9385


Epoch [1226/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.77it/s, loss=1.02]


Epoch [1226/5000]: Train loss: 1.0285, Valid loss: 0.9115


Epoch [1227/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.31it/s, loss=1.25]


Epoch [1227/5000]: Train loss: 1.0434, Valid loss: 0.9206


Epoch [1228/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.43it/s, loss=1.03]


Epoch [1228/5000]: Train loss: 1.0279, Valid loss: 0.9144


Epoch [1229/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.41it/s, loss=0.889]


Epoch [1229/5000]: Train loss: 1.0299, Valid loss: 0.9705


Epoch [1230/5000]: 100%|██████████| 14/14 [00:00<00:00, 212.21it/s, loss=1.18]


Epoch [1230/5000]: Train loss: 1.0410, Valid loss: 0.9077


Epoch [1231/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.12it/s, loss=0.867]


Epoch [1231/5000]: Train loss: 1.0205, Valid loss: 0.9362


Epoch [1232/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.50it/s, loss=1.19]


Epoch [1232/5000]: Train loss: 1.0415, Valid loss: 0.9146


Epoch [1233/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.39it/s, loss=0.883]


Epoch [1233/5000]: Train loss: 1.0268, Valid loss: 0.9206


Epoch [1234/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.25it/s, loss=0.984]


Epoch [1234/5000]: Train loss: 1.0256, Valid loss: 0.9191


Epoch [1235/5000]: 100%|██████████| 14/14 [00:00<00:00, 172.96it/s, loss=1.17]


Epoch [1235/5000]: Train loss: 1.0360, Valid loss: 0.9145


Epoch [1236/5000]: 100%|██████████| 14/14 [00:00<00:00, 170.88it/s, loss=0.966]


Epoch [1236/5000]: Train loss: 1.0259, Valid loss: 0.9115


Epoch [1237/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.67it/s, loss=0.682]


Epoch [1237/5000]: Train loss: 1.0159, Valid loss: 0.9347


Epoch [1238/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.54it/s, loss=1.1]


Epoch [1238/5000]: Train loss: 1.0425, Valid loss: 1.0102


Epoch [1239/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.40it/s, loss=1.13]


Epoch [1239/5000]: Train loss: 1.0526, Valid loss: 0.9145


Epoch [1240/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.10it/s, loss=1.04]


Epoch [1240/5000]: Train loss: 1.0368, Valid loss: 0.9304


Epoch [1241/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.20it/s, loss=1.48]


Epoch [1241/5000]: Train loss: 1.0545, Valid loss: 0.9237


Epoch [1242/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.29it/s, loss=0.938]


Epoch [1242/5000]: Train loss: 1.0276, Valid loss: 0.9122


Epoch [1243/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.47it/s, loss=0.828]


Epoch [1243/5000]: Train loss: 1.0167, Valid loss: 0.9272


Epoch [1244/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.20it/s, loss=0.921]


Epoch [1244/5000]: Train loss: 1.0276, Valid loss: 0.9094


Epoch [1245/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.49it/s, loss=1.2]


Epoch [1245/5000]: Train loss: 1.0399, Valid loss: 0.9199


Epoch [1246/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.12it/s, loss=0.875]


Epoch [1246/5000]: Train loss: 1.0225, Valid loss: 0.9512


Epoch [1247/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.47it/s, loss=0.759]


Epoch [1247/5000]: Train loss: 1.0292, Valid loss: 0.9240


Epoch [1248/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.50it/s, loss=1.34]


Epoch [1248/5000]: Train loss: 1.0485, Valid loss: 0.9215


Epoch [1249/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.67it/s, loss=1.09]


Epoch [1249/5000]: Train loss: 1.0287, Valid loss: 0.9162


Epoch [1250/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.72it/s, loss=1.08]


Epoch [1250/5000]: Train loss: 1.0261, Valid loss: 0.9320


Epoch [1251/5000]: 100%|██████████| 14/14 [00:00<00:00, 210.40it/s, loss=1.05]


Epoch [1251/5000]: Train loss: 1.0296, Valid loss: 0.9192


Epoch [1252/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.54it/s, loss=1.21]


Epoch [1252/5000]: Train loss: 1.0574, Valid loss: 0.9442


Epoch [1253/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.56it/s, loss=1.02]


Epoch [1253/5000]: Train loss: 1.0345, Valid loss: 0.9144


Epoch [1254/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.42it/s, loss=0.966]


Epoch [1254/5000]: Train loss: 1.0249, Valid loss: 0.9257


Epoch [1255/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.18it/s, loss=1.11]


Epoch [1255/5000]: Train loss: 1.0487, Valid loss: 0.9641


Epoch [1256/5000]: 100%|██████████| 14/14 [00:00<00:00, 156.90it/s, loss=1]


Epoch [1256/5000]: Train loss: 1.0570, Valid loss: 0.9557


Epoch [1257/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.71it/s, loss=1.02]


Epoch [1257/5000]: Train loss: 1.0611, Valid loss: 0.9288


Epoch [1258/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.53it/s, loss=1.04]


Epoch [1258/5000]: Train loss: 1.0375, Valid loss: 0.9473


Epoch [1259/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.79it/s, loss=1.06]


Epoch [1259/5000]: Train loss: 1.0266, Valid loss: 0.9186


Epoch [1260/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.37it/s, loss=0.954]


Epoch [1260/5000]: Train loss: 1.0273, Valid loss: 0.9409


Epoch [1261/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.62it/s, loss=1.03]


Epoch [1261/5000]: Train loss: 1.0262, Valid loss: 0.9161


Epoch [1262/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.08it/s, loss=0.93]


Epoch [1262/5000]: Train loss: 1.0277, Valid loss: 0.9229


Epoch [1263/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.21it/s, loss=0.99]


Epoch [1263/5000]: Train loss: 1.0503, Valid loss: 0.9648


Epoch [1264/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.74it/s, loss=1.06]


Epoch [1264/5000]: Train loss: 1.0401, Valid loss: 0.9644


Epoch [1265/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.50it/s, loss=0.996]


Epoch [1265/5000]: Train loss: 1.0354, Valid loss: 0.9096


Epoch [1266/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.10it/s, loss=1.14]


Epoch [1266/5000]: Train loss: 1.0373, Valid loss: 0.9346


Epoch [1267/5000]: 100%|██████████| 14/14 [00:00<00:00, 187.71it/s, loss=1.14]


Epoch [1267/5000]: Train loss: 1.0315, Valid loss: 0.9122


Epoch [1268/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.48it/s, loss=1.09]


Epoch [1268/5000]: Train loss: 1.0319, Valid loss: 0.9091


Epoch [1269/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.70it/s, loss=0.944]


Epoch [1269/5000]: Train loss: 1.0273, Valid loss: 0.9249


Epoch [1270/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.42it/s, loss=1.2]


Epoch [1270/5000]: Train loss: 1.0355, Valid loss: 0.9281


Epoch [1271/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.00it/s, loss=1.02]


Epoch [1271/5000]: Train loss: 1.0241, Valid loss: 0.9212


Epoch [1272/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.31it/s, loss=0.979]


Epoch [1272/5000]: Train loss: 1.0231, Valid loss: 0.9076


Epoch [1273/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.24it/s, loss=0.973]


Epoch [1273/5000]: Train loss: 1.0397, Valid loss: 0.9494


Epoch [1274/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.51it/s, loss=0.965]


Epoch [1274/5000]: Train loss: 1.0313, Valid loss: 0.9385


Epoch [1275/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.19it/s, loss=0.93]


Epoch [1275/5000]: Train loss: 1.0225, Valid loss: 0.9444


Epoch [1276/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.00it/s, loss=0.924]


Epoch [1276/5000]: Train loss: 1.0276, Valid loss: 0.9237


Epoch [1277/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.63it/s, loss=1.01]


Epoch [1277/5000]: Train loss: 1.0298, Valid loss: 0.9265


Epoch [1278/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.21it/s, loss=0.968]


Epoch [1278/5000]: Train loss: 1.0298, Valid loss: 0.9281


Epoch [1279/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.76it/s, loss=1.2]


Epoch [1279/5000]: Train loss: 1.0389, Valid loss: 0.9342


Epoch [1280/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.97it/s, loss=0.804]


Epoch [1280/5000]: Train loss: 1.0174, Valid loss: 0.9110


Epoch [1281/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.17it/s, loss=0.742]


Epoch [1281/5000]: Train loss: 1.0115, Valid loss: 0.9143


Epoch [1282/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.39it/s, loss=1.11]


Epoch [1282/5000]: Train loss: 1.0329, Valid loss: 0.9261


Epoch [1283/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.02it/s, loss=1.02]


Epoch [1283/5000]: Train loss: 1.0427, Valid loss: 0.9507


Epoch [1284/5000]: 100%|██████████| 14/14 [00:00<00:00, 185.66it/s, loss=0.927]


Epoch [1284/5000]: Train loss: 1.0454, Valid loss: 0.9148


Epoch [1285/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.58it/s, loss=1.2]


Epoch [1285/5000]: Train loss: 1.0525, Valid loss: 0.9405


Epoch [1286/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.71it/s, loss=1.11]


Epoch [1286/5000]: Train loss: 1.0322, Valid loss: 0.9653


Epoch [1287/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.21it/s, loss=1.1]


Epoch [1287/5000]: Train loss: 1.0477, Valid loss: 0.9488


Epoch [1288/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.33it/s, loss=1.27]


Epoch [1288/5000]: Train loss: 1.0425, Valid loss: 0.9132


Epoch [1289/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.51it/s, loss=1.07]


Epoch [1289/5000]: Train loss: 1.0420, Valid loss: 0.9300


Epoch [1290/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.94it/s, loss=1.05]


Epoch [1290/5000]: Train loss: 1.0463, Valid loss: 0.9701


Epoch [1291/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.11it/s, loss=0.783]


Epoch [1291/5000]: Train loss: 1.0231, Valid loss: 0.9491


Epoch [1292/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.02it/s, loss=1.1]


Epoch [1292/5000]: Train loss: 1.0343, Valid loss: 0.9226


Epoch [1293/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.82it/s, loss=1.01]


Epoch [1293/5000]: Train loss: 1.0278, Valid loss: 0.9256


Epoch [1294/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.72it/s, loss=1.01]


Epoch [1294/5000]: Train loss: 1.0469, Valid loss: 0.9296


Epoch [1295/5000]: 100%|██████████| 14/14 [00:00<00:00, 186.74it/s, loss=1.07]


Epoch [1295/5000]: Train loss: 1.0404, Valid loss: 0.9742


Epoch [1296/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.97it/s, loss=1.07]


Epoch [1296/5000]: Train loss: 1.0406, Valid loss: 0.9339


Epoch [1297/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.70it/s, loss=1.09]


Epoch [1297/5000]: Train loss: 1.0322, Valid loss: 0.9146


Epoch [1298/5000]: 100%|██████████| 14/14 [00:00<00:00, 176.44it/s, loss=0.816]


Epoch [1298/5000]: Train loss: 1.0203, Valid loss: 0.9199


Epoch [1299/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.81it/s, loss=0.841]


Epoch [1299/5000]: Train loss: 1.0181, Valid loss: 0.9184


Epoch [1300/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.65it/s, loss=0.98]


Epoch [1300/5000]: Train loss: 1.0235, Valid loss: 0.9204


Epoch [1301/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.14it/s, loss=0.92]


Epoch [1301/5000]: Train loss: 1.0311, Valid loss: 0.9304


Epoch [1302/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.09it/s, loss=1.13]


Epoch [1302/5000]: Train loss: 1.0341, Valid loss: 0.9262


Epoch [1303/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.15it/s, loss=0.973]


Epoch [1303/5000]: Train loss: 1.0296, Valid loss: 0.9539


Epoch [1304/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.68it/s, loss=0.931]


Epoch [1304/5000]: Train loss: 1.0267, Valid loss: 0.9377


Epoch [1305/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.92it/s, loss=1.2]


Epoch [1305/5000]: Train loss: 1.0341, Valid loss: 0.9500


Epoch [1306/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.93it/s, loss=1.26]


Epoch [1306/5000]: Train loss: 1.0341, Valid loss: 0.9152


Epoch [1307/5000]: 100%|██████████| 14/14 [00:00<00:00, 178.50it/s, loss=1.15]


Epoch [1307/5000]: Train loss: 1.0358, Valid loss: 0.9335


Epoch [1308/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.06it/s, loss=1.18]


Epoch [1308/5000]: Train loss: 1.0334, Valid loss: 0.9235


Epoch [1309/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.64it/s, loss=0.996]


Epoch [1309/5000]: Train loss: 1.0302, Valid loss: 0.9387


Epoch [1310/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.25it/s, loss=1.23]


Epoch [1310/5000]: Train loss: 1.0376, Valid loss: 0.9180


Epoch [1311/5000]: 100%|██████████| 14/14 [00:00<00:00, 196.38it/s, loss=0.865]


Epoch [1311/5000]: Train loss: 1.0188, Valid loss: 0.9229


Epoch [1312/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.06it/s, loss=0.879]


Epoch [1312/5000]: Train loss: 1.0286, Valid loss: 0.9489


Epoch [1313/5000]: 100%|██████████| 14/14 [00:00<00:00, 165.62it/s, loss=0.993]


Epoch [1313/5000]: Train loss: 1.0241, Valid loss: 0.9108


Epoch [1314/5000]: 100%|██████████| 14/14 [00:00<00:00, 142.50it/s, loss=0.936]


Epoch [1314/5000]: Train loss: 1.0260, Valid loss: 0.9255


Epoch [1315/5000]: 100%|██████████| 14/14 [00:00<00:00, 145.46it/s, loss=0.893]


Epoch [1315/5000]: Train loss: 1.0192, Valid loss: 0.9288


Epoch [1316/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.67it/s, loss=1.15]


Epoch [1316/5000]: Train loss: 1.0302, Valid loss: 0.9157


Epoch [1317/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.37it/s, loss=0.887]


Epoch [1317/5000]: Train loss: 1.0197, Valid loss: 0.9180


Epoch [1318/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.01it/s, loss=0.947]


Epoch [1318/5000]: Train loss: 1.0251, Valid loss: 0.9190


Epoch [1319/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.68it/s, loss=1.03]


Epoch [1319/5000]: Train loss: 1.0267, Valid loss: 0.9171


Epoch [1320/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.13it/s, loss=0.869]


Epoch [1320/5000]: Train loss: 1.0190, Valid loss: 0.9154


Epoch [1321/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.15it/s, loss=1.1]


Epoch [1321/5000]: Train loss: 1.0323, Valid loss: 0.9205


Epoch [1322/5000]: 100%|██████████| 14/14 [00:00<00:00, 211.48it/s, loss=1.02]


Epoch [1322/5000]: Train loss: 1.0351, Valid loss: 0.9177


Epoch [1323/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.12it/s, loss=0.91]


Epoch [1323/5000]: Train loss: 1.0244, Valid loss: 0.9182


Epoch [1324/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.92it/s, loss=0.889]


Epoch [1324/5000]: Train loss: 1.0174, Valid loss: 0.9391


Epoch [1325/5000]: 100%|██████████| 14/14 [00:00<00:00, 175.55it/s, loss=1.06]


Epoch [1325/5000]: Train loss: 1.0406, Valid loss: 0.9834


Epoch [1326/5000]: 100%|██████████| 14/14 [00:00<00:00, 181.89it/s, loss=0.867]


Epoch [1326/5000]: Train loss: 1.0187, Valid loss: 0.9219


Epoch [1327/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.59it/s, loss=1.09]


Epoch [1327/5000]: Train loss: 1.0335, Valid loss: 0.9208


Epoch [1328/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.98it/s, loss=1.07]


Epoch [1328/5000]: Train loss: 1.0312, Valid loss: 0.9088


Epoch [1329/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.68it/s, loss=0.929]


Epoch [1329/5000]: Train loss: 1.0321, Valid loss: 0.9579


Epoch [1330/5000]: 100%|██████████| 14/14 [00:00<00:00, 189.28it/s, loss=1.03]


Epoch [1330/5000]: Train loss: 1.0306, Valid loss: 0.9174


Epoch [1331/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.40it/s, loss=0.968]


Epoch [1331/5000]: Train loss: 1.0271, Valid loss: 0.9271


Epoch [1332/5000]: 100%|██████████| 14/14 [00:00<00:00, 182.48it/s, loss=0.875]


Epoch [1332/5000]: Train loss: 1.0230, Valid loss: 0.9502


Epoch [1333/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.06it/s, loss=0.952]


Epoch [1333/5000]: Train loss: 1.0248, Valid loss: 0.9077


Epoch [1334/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.79it/s, loss=1.03]


Epoch [1334/5000]: Train loss: 1.0304, Valid loss: 0.9357


Epoch [1335/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.03it/s, loss=0.996]


Epoch [1335/5000]: Train loss: 1.0304, Valid loss: 0.9439


Epoch [1336/5000]: 100%|██████████| 14/14 [00:00<00:00, 171.26it/s, loss=0.978]


Epoch [1336/5000]: Train loss: 1.0222, Valid loss: 0.9286


Epoch [1337/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.01it/s, loss=0.928]


Epoch [1337/5000]: Train loss: 1.0324, Valid loss: 0.9382


Epoch [1338/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.85it/s, loss=0.995]


Epoch [1338/5000]: Train loss: 1.0257, Valid loss: 0.9418


Epoch [1339/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.01it/s, loss=1.05]


Epoch [1339/5000]: Train loss: 1.0289, Valid loss: 0.9124


Epoch [1340/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.47it/s, loss=0.932]


Epoch [1340/5000]: Train loss: 1.0263, Valid loss: 0.9329


Epoch [1341/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.14it/s, loss=1.11]


Epoch [1341/5000]: Train loss: 1.0352, Valid loss: 1.0082


Epoch [1342/5000]: 100%|██████████| 14/14 [00:00<00:00, 206.18it/s, loss=0.872]


Epoch [1342/5000]: Train loss: 1.0234, Valid loss: 0.9236


Epoch [1343/5000]: 100%|██████████| 14/14 [00:00<00:00, 214.24it/s, loss=1.43]


Epoch [1343/5000]: Train loss: 1.0547, Valid loss: 0.9309


Epoch [1344/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.12it/s, loss=1.07]


Epoch [1344/5000]: Train loss: 1.0385, Valid loss: 0.9738


Epoch [1345/5000]: 100%|██████████| 14/14 [00:00<00:00, 179.84it/s, loss=1.13]


Epoch [1345/5000]: Train loss: 1.0344, Valid loss: 0.9130


Epoch [1346/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.76it/s, loss=0.994]


Epoch [1346/5000]: Train loss: 1.0249, Valid loss: 0.9255


Epoch [1347/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.12it/s, loss=1.11]


Epoch [1347/5000]: Train loss: 1.0328, Valid loss: 0.9208


Epoch [1348/5000]: 100%|██████████| 14/14 [00:00<00:00, 217.06it/s, loss=0.99]


Epoch [1348/5000]: Train loss: 1.0243, Valid loss: 0.9234


Epoch [1349/5000]: 100%|██████████| 14/14 [00:00<00:00, 213.34it/s, loss=1.04]


Epoch [1349/5000]: Train loss: 1.0264, Valid loss: 0.9190


Epoch [1350/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.78it/s, loss=1.04]


Epoch [1350/5000]: Train loss: 1.0288, Valid loss: 0.9242


Epoch [1351/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.76it/s, loss=1.06]


Epoch [1351/5000]: Train loss: 1.0282, Valid loss: 0.9277


Epoch [1352/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.94it/s, loss=0.953]


Epoch [1352/5000]: Train loss: 1.0236, Valid loss: 0.9327


Epoch [1353/5000]: 100%|██████████| 14/14 [00:00<00:00, 209.30it/s, loss=1.34]


Epoch [1353/5000]: Train loss: 1.0469, Valid loss: 0.9131


Epoch [1354/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.44it/s, loss=1.09]


Epoch [1354/5000]: Train loss: 1.0352, Valid loss: 0.9853


Epoch [1355/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.34it/s, loss=1.03]


Epoch [1355/5000]: Train loss: 1.0338, Valid loss: 0.9236


Epoch [1356/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.88it/s, loss=1.3]


Epoch [1356/5000]: Train loss: 1.0398, Valid loss: 0.9390


Epoch [1357/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.31it/s, loss=1.03]


Epoch [1357/5000]: Train loss: 1.0234, Valid loss: 0.9293


Epoch [1358/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.03it/s, loss=1.07]


Epoch [1358/5000]: Train loss: 1.0384, Valid loss: 0.9244


Epoch [1359/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.32it/s, loss=0.736]


Epoch [1359/5000]: Train loss: 1.0273, Valid loss: 0.9563


Epoch [1360/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.29it/s, loss=1.03]


Epoch [1360/5000]: Train loss: 1.0406, Valid loss: 0.9726


Epoch [1361/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.94it/s, loss=1.33]


Epoch [1361/5000]: Train loss: 1.0441, Valid loss: 0.9274


Epoch [1362/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.21it/s, loss=1.22]


Epoch [1362/5000]: Train loss: 1.0361, Valid loss: 0.9308


Epoch [1363/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.04it/s, loss=1.41]


Epoch [1363/5000]: Train loss: 1.0439, Valid loss: 0.9517


Epoch [1364/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.92it/s, loss=0.988]


Epoch [1364/5000]: Train loss: 1.0277, Valid loss: 0.9238


Epoch [1365/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.38it/s, loss=1.05]


Epoch [1365/5000]: Train loss: 1.0294, Valid loss: 0.9234


Epoch [1366/5000]: 100%|██████████| 14/14 [00:00<00:00, 205.63it/s, loss=0.961]


Epoch [1366/5000]: Train loss: 1.0337, Valid loss: 1.0053


Epoch [1367/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.29it/s, loss=1.34]


Epoch [1367/5000]: Train loss: 1.0589, Valid loss: 0.9330


Epoch [1368/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.59it/s, loss=1.35]


Epoch [1368/5000]: Train loss: 1.0428, Valid loss: 0.9280


Epoch [1369/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.15it/s, loss=1.11]


Epoch [1369/5000]: Train loss: 1.0368, Valid loss: 1.0242


Epoch [1370/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.79it/s, loss=0.928]


Epoch [1370/5000]: Train loss: 1.0322, Valid loss: 0.9404


Epoch [1371/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.82it/s, loss=1.03]


Epoch [1371/5000]: Train loss: 1.0312, Valid loss: 0.9207


Epoch [1372/5000]: 100%|██████████| 14/14 [00:00<00:00, 207.44it/s, loss=1.04]


Epoch [1372/5000]: Train loss: 1.0283, Valid loss: 0.9339


Epoch [1373/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.88it/s, loss=1.25]


Epoch [1373/5000]: Train loss: 1.0375, Valid loss: 0.9174


Epoch [1374/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.56it/s, loss=0.834]


Epoch [1374/5000]: Train loss: 1.0161, Valid loss: 0.9260


Epoch [1375/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.02it/s, loss=1.02]


Epoch [1375/5000]: Train loss: 1.0247, Valid loss: 0.9361


Epoch [1376/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.97it/s, loss=0.904]


Epoch [1376/5000]: Train loss: 1.0226, Valid loss: 0.9222


Epoch [1377/5000]: 100%|██████████| 14/14 [00:00<00:00, 180.46it/s, loss=1.04]


Epoch [1377/5000]: Train loss: 1.0312, Valid loss: 0.9505


Epoch [1378/5000]: 100%|██████████| 14/14 [00:00<00:00, 193.53it/s, loss=0.928]


Epoch [1378/5000]: Train loss: 1.0220, Valid loss: 0.9113


Epoch [1379/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.95it/s, loss=0.922]


Epoch [1379/5000]: Train loss: 1.0207, Valid loss: 0.9162


Epoch [1380/5000]: 100%|██████████| 14/14 [00:00<00:00, 190.82it/s, loss=1.03]


Epoch [1380/5000]: Train loss: 1.0257, Valid loss: 0.9176


Epoch [1381/5000]: 100%|██████████| 14/14 [00:00<00:00, 208.68it/s, loss=1.48]


Epoch [1381/5000]: Train loss: 1.0514, Valid loss: 0.9159


Epoch [1382/5000]: 100%|██████████| 14/14 [00:00<00:00, 204.79it/s, loss=0.935]


Epoch [1382/5000]: Train loss: 1.0228, Valid loss: 0.9261


Epoch [1383/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.13it/s, loss=1.44]


Epoch [1383/5000]: Train loss: 1.0522, Valid loss: 1.0063


Epoch [1384/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.61it/s, loss=1.07]


Epoch [1384/5000]: Train loss: 1.0406, Valid loss: 0.9214


Epoch [1385/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.96it/s, loss=0.984]


Epoch [1385/5000]: Train loss: 1.0226, Valid loss: 0.9222


Epoch [1386/5000]: 100%|██████████| 14/14 [00:00<00:00, 188.51it/s, loss=1.15]


Epoch [1386/5000]: Train loss: 1.0342, Valid loss: 0.9188


Epoch [1387/5000]: 100%|██████████| 14/14 [00:00<00:00, 102.47it/s, loss=1.04] 


Epoch [1387/5000]: Train loss: 1.0316, Valid loss: 0.9128


Epoch [1388/5000]: 100%|██████████| 14/14 [00:00<00:00, 98.27it/s, loss=0.951]


Epoch [1388/5000]: Train loss: 1.0245, Valid loss: 0.9226


Epoch [1389/5000]: 100%|██████████| 14/14 [00:00<00:00, 100.73it/s, loss=1.16]


Epoch [1389/5000]: Train loss: 1.0313, Valid loss: 0.9150


Epoch [1390/5000]: 100%|██████████| 14/14 [00:00<00:00, 102.20it/s, loss=1.24]


Epoch [1390/5000]: Train loss: 1.0391, Valid loss: 0.9252


Epoch [1391/5000]: 100%|██████████| 14/14 [00:00<00:00, 101.07it/s, loss=1.09]


Epoch [1391/5000]: Train loss: 1.0288, Valid loss: 0.9434


Epoch [1392/5000]: 100%|██████████| 14/14 [00:00<00:00, 104.74it/s, loss=1.21]


Epoch [1392/5000]: Train loss: 1.0396, Valid loss: 0.9254


Epoch [1393/5000]: 100%|██████████| 14/14 [00:00<00:00, 102.23it/s, loss=0.826]


Epoch [1393/5000]: Train loss: 1.0202, Valid loss: 0.9230


Epoch [1394/5000]: 100%|██████████| 14/14 [00:00<00:00, 114.02it/s, loss=0.96]


Epoch [1394/5000]: Train loss: 1.0228, Valid loss: 0.9216


Epoch [1395/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.69it/s, loss=0.949]


Epoch [1395/5000]: Train loss: 1.0316, Valid loss: 0.9186


Epoch [1396/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.83it/s, loss=0.941]


Epoch [1396/5000]: Train loss: 1.0232, Valid loss: 0.9231


Epoch [1397/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.40it/s, loss=0.86]


Epoch [1397/5000]: Train loss: 1.0352, Valid loss: 0.9655


Epoch [1398/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.58it/s, loss=0.998]


Epoch [1398/5000]: Train loss: 1.0233, Valid loss: 0.9341


Epoch [1399/5000]: 100%|██████████| 14/14 [00:00<00:00, 198.00it/s, loss=0.936]


Epoch [1399/5000]: Train loss: 1.0333, Valid loss: 0.9320


Epoch [1400/5000]: 100%|██████████| 14/14 [00:00<00:00, 199.84it/s, loss=0.879]


Epoch [1400/5000]: Train loss: 1.0307, Valid loss: 0.9243


Epoch [1401/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.74it/s, loss=1.03]


Epoch [1401/5000]: Train loss: 1.0282, Valid loss: 0.9532


Epoch [1402/5000]: 100%|██████████| 14/14 [00:00<00:00, 192.83it/s, loss=1.19]


Epoch [1402/5000]: Train loss: 1.0350, Valid loss: 0.9215


Epoch [1403/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.62it/s, loss=1.02]


Epoch [1403/5000]: Train loss: 1.0254, Valid loss: 0.9368


Epoch [1404/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.46it/s, loss=0.906]


Epoch [1404/5000]: Train loss: 1.0190, Valid loss: 0.9341


Epoch [1405/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.38it/s, loss=0.87]


Epoch [1405/5000]: Train loss: 1.0190, Valid loss: 0.9218


Epoch [1406/5000]: 100%|██████████| 14/14 [00:00<00:00, 197.94it/s, loss=1.37]


Epoch [1406/5000]: Train loss: 1.0384, Valid loss: 0.9243


Epoch [1407/5000]: 100%|██████████| 14/14 [00:00<00:00, 203.87it/s, loss=0.969]


Epoch [1407/5000]: Train loss: 1.0286, Valid loss: 0.9268


Epoch [1408/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.27it/s, loss=0.885]


Epoch [1408/5000]: Train loss: 1.0194, Valid loss: 0.9165


Epoch [1409/5000]: 100%|██████████| 14/14 [00:00<00:00, 201.59it/s, loss=0.965]


Epoch [1409/5000]: Train loss: 1.0275, Valid loss: 0.9611


Epoch [1410/5000]: 100%|██████████| 14/14 [00:00<00:00, 200.39it/s, loss=1.03]


Epoch [1410/5000]: Train loss: 1.0283, Valid loss: 0.9721


Epoch [1411/5000]: 100%|██████████| 14/14 [00:00<00:00, 202.41it/s, loss=1.24]


Epoch [1411/5000]: Train loss: 1.0400, Valid loss: 0.9431


Epoch [1412/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.93it/s, loss=1.04]


Epoch [1412/5000]: Train loss: 1.0237, Valid loss: 0.9185


Epoch [1413/5000]: 100%|██████████| 14/14 [00:00<00:00, 195.92it/s, loss=1.04]


Epoch [1413/5000]: Train loss: 1.0460, Valid loss: 0.9369


Epoch [1414/5000]: 100%|██████████| 14/14 [00:00<00:00, 191.74it/s, loss=1.21]


Epoch [1414/5000]: Train loss: 1.0457, Valid loss: 0.9832


Epoch [1415/5000]: 100%|██████████| 14/14 [00:00<00:00, 184.54it/s, loss=1.13]


Epoch [1415/5000]: Train loss: 1.0458, Valid loss: 0.9378


Epoch [1416/5000]: 100%|██████████| 14/14 [00:00<00:00, 194.14it/s, loss=1.04]

Epoch [1416/5000]: Train loss: 1.0375, Valid loss: 0.9330

Model is not improving, so we halt the training session.





In [343]:
model = My_Model(x_train.shape[1])
model.load_state_dict(torch.load('./models/model.ckpt'))
model

My_Model(
  (layers): Sequential(
    (0): Linear(in_features=17, out_features=16, bias=True)
    (1): ReLU()
    (2): Linear(in_features=16, out_features=8, bias=True)
    (3): ReLU()
    (4): Linear(in_features=8, out_features=1, bias=True)
  )
  (criterion): MSELoss()
)

In [344]:
ans_list=predict(test_loader,model,device)
for i in ans_list:
    print(i)

100%|██████████| 6/6 [00:00<00:00, 818.99it/s]

8.632099
9.617362
5.218893
9.06739
16.748348
14.303404
10.188602
14.515184
13.591484
10.976449
6.813446
9.719425
9.3431635
17.565619
12.318797
6.293479
9.269344
5.5787263
8.107579
9.730932
19.655272
5.938665
9.486419
10.147348
13.794051
18.901451
22.472286
8.691757
7.1962304
15.278135
14.666273
3.9945574
11.777687
9.161927
8.944863
6.362466
13.480566
16.98807
9.615365
13.787729
15.049558
24.901632
5.658922
11.033492
23.81338
22.165157
17.42175
5.3990493
10.783366
6.271143
4.384781
8.374525
14.517724
16.278423
16.931906
19.469172
16.642149
10.991684
24.85467
8.382032
18.198847
19.252989
12.041155
17.025702
20.353592
12.915014
10.4307165
6.1995497
6.8477564
15.974709
21.677483
19.172342
6.04385
11.404367
17.76888
14.192119
16.392694
12.897686
10.103641
16.56702
22.88391
6.007495
22.80577
17.017399
23.331217
9.535613
9.761043
16.025211
26.406115
5.481267
15.336085
15.56584
18.948359
20.934221
21.124323
10.799182
30.732416
8.688182
20.531359
18.632065
18.792353
18.02988
8.618613
16.75842
1




In [15]:
def save_pred(preds, file):
    ''' Save predictions to specified file '''
    with open(file, 'w') as fp:
        writer = csv.writer(fp)
        writer.writerow(['id', 'tested_positive'])
        for i, p in enumerate(preds):
            writer.writerow([i, p])

model = My_Model(input_dim=x_train.shape[1]).to(device)
model.load_state_dict(torch.load(config['save_path']))
preds = predict(test_loader, model, device) 
save_pred(preds, 'pred.csv')         

/bin/bash: kaggle: command not found
