# **Homework 1: COVID-19 Cases Prediction (Regression)**

Objectives:
* Solve a regression problem with deep neural networks (DNN).
* Understand basic DNN training tips.
* Familiarize yourself with PyTorch.

If you have any questions, please contact the TAs via TA hours, NTU COOL, or by email at mlta-2022-spring@googlegroups.com.

# Download data
If the Google Drive links below do not work, you can download the data from [Kaggle](https://www.kaggle.com/t/a3ebd5b5542f0f55e828d4f00de8e59a) and upload it manually to the workspace.

In [1]:
# !gdown --id '1kLSW_-cW2Huj7bh84YTdimGBOJaODiOS' --output covid.train.csv
# !gdown --id '1iiI5qROrAhZn-o4FPqsE97bMzDEFvIdg' --output covid.test.csv

# Import packages

In [2]:
# Numerical Operations
import math
import numpy as np

# Reading/Writing Data
import pandas as pd
import os
import csv

# For Progress Bar
from tqdm import tqdm

# Pytorch
import torch 
import torch.nn as nn
from torch.utils.data import Dataset, DataLoader, random_split
from torch.backends import cudnn

# For plotting learning curve
from torch.utils.tensorboard import SummaryWriter

# Some Utility Functions

You do not need to modify this part.

In [3]:
def same_seed(seed):
    '''Seed the NumPy and PyTorch random number generators for reproducibility.

    Also sets cuDNN's `deterministic` flag to True and its `benchmark` flag
    to False. Returns nothing.
    '''
    # Seed the CPU-side generators.
    np.random.seed(seed)
    torch.manual_seed(seed)

    # Seed the CUDA generators too, but only when CUDA is actually usable.
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(seed)

    # Configure the cuDNN backend flags.
    cudnn_backend = torch.backends.cudnn
    cudnn_backend.benchmark = False
    cudnn_backend.deterministic = True

def train_valid_split(data_set, valid_ratio, seed):
    '''Randomly split the provided training data into a training set and a validation set.

    Args:
        data_set: Array-like of samples, indexed along its first axis.
        valid_ratio: Fraction of the samples assigned to the validation set;
            the validation size is int(valid_ratio * len(data_set)).
        seed: Seed for the torch.Generator that drives the random split.

    Returns:
        (train_set, valid_set) as NumPy arrays holding the selected rows.
    '''
    valid_set_size = int(valid_ratio * len(data_set))
    train_set_size = len(data_set) - valid_set_size
    train_subset, valid_subset = random_split(
        data_set,
        [train_set_size, valid_set_size],
        generator=torch.Generator().manual_seed(seed),
    )
    # Index the underlying data once per split using the indices chosen by
    # random_split, instead of letting np.array() fetch rows one by one through
    # Subset.__getitem__. This also keeps the trailing dimensions when a split
    # is empty (shape (0, n_cols) rather than a 1-D empty array).
    data = np.asarray(data_set)
    return data[train_subset.indices], data[valid_subset.indices]

def predict(test_loader, model, device):
    '''Run `model` over every batch of `test_loader` and return all predictions.

    The model is switched to evaluation mode, each batch is moved to `device`,
    and the per-batch outputs are concatenated along dim 0 and returned as a
    NumPy array.
    '''
    model.eval() # Set your model to evaluation mode.
    batch_outputs = []
    # Inference only: no gradients are needed for any of the batches.
    with torch.no_grad():
        for batch in tqdm(test_loader):
            output = model(batch.to(device))
            # Bring each result back to the CPU so they can be concatenated.
            batch_outputs.append(output.detach().cpu())
    return torch.cat(batch_outputs, dim=0).numpy()

# Dataset

In [4]:
class COVID19Dataset(Dataset):
    '''
    Dataset holding feature rows and, optionally, their targets.

    x: Features.
    y: Targets; when None the dataset is used for prediction and
       indexing returns features only.
    '''
    def __init__(self, x, y=None):
        # Targets are optional; both are stored as float tensors when present.
        self.y = None if y is None else torch.FloatTensor(y)
        self.x = torch.FloatTensor(x)

    def __len__(self):
        return len(self.x)

    def __getitem__(self, idx):
        features = self.x[idx]
        if self.y is not None:
            return features, self.y[idx]
        return features

# Neural Network Model
Try out different model architectures by modifying the class below.

In [5]:
class My_Model(nn.Module):
    '''Small fully connected regressor: input_dim -> 16 -> 8 -> 1 with ReLU in between.'''
    def __init__(self, input_dim):
        super().__init__()
        # TODO: modify model's structure, be aware of dimensions.
        widths = [input_dim, 16, 8]
        blocks = []
        # One Linear + ReLU pair per hidden layer, then the single-output head.
        for in_features, out_features in zip(widths[:-1], widths[1:]):
            blocks.append(nn.Linear(in_features, out_features))
            blocks.append(nn.ReLU())
        blocks.append(nn.Linear(widths[-1], 1))
        self.layers = nn.Sequential(*blocks)

    def forward(self, x):
        # Drop the trailing singleton dimension: (B, 1) -> (B)
        return self.layers(x).squeeze(1)

# Feature Selection
Choose features you deem useful by modifying the function below.

In [6]:
def select_feat(train_data, valid_data, test_data, select_all=True):
    '''Select the feature columns used for regression and split off the targets.

    The last column of `train_data` and `valid_data` is taken as the target;
    `test_data` is used as features only. With `select_all` every feature
    column is kept, otherwise only a fixed set of column ranges is kept.

    Returns (x_train, x_valid, x_test, y_train, y_valid).
    '''
    # Targets are the last column; everything before it is a candidate feature.
    raw_x_train, y_train = train_data[:, :-1], train_data[:, -1]
    raw_x_valid, y_valid = valid_data[:, :-1], valid_data[:, -1]
    raw_x_test = test_data

    if select_all:
        feat_idx = list(range(raw_x_train.shape[1]))
    else:
        # TODO: Select suitable feature columns.
        # Half-open [start, stop) column ranges that are kept as features.
        column_spans = [(1, 38), (38, 43), (53, 59), (69, 75), (85, 91), (101, 107)]
        feat_idx = np.concatenate([np.arange(start, stop) for start, stop in column_spans])

    x_train = raw_x_train[:, feat_idx]
    x_valid = raw_x_valid[:, feat_idx]
    x_test = raw_x_test[:, feat_idx]
    return x_train, x_valid, x_test, y_train, y_valid

# Training Loop

In [7]:
def trainer(train_loader, valid_loader, model, config, device):
    '''Train `model` with MSE loss, checkpointing on the best validation loss.

    Each epoch runs one pass over `train_loader` (with parameter updates) and
    one pass over `valid_loader` (without gradients). Whenever the mean
    validation loss improves, the model's state_dict is saved to
    config['save_path']. Training stops early once the validation loss has not
    improved for config['early_stop'] consecutive epochs.

    Args:
        train_loader: Iterable yielding (x, y) training batches.
        valid_loader: Iterable yielding (x, y) validation batches.
        model: The nn.Module to train; its parameters are updated in place.
        config: Dict providing 'learning_rate', 'n_epochs', 'early_stop'
            and 'save_path'.
        device: Device each batch is moved to before the forward pass.

    Returns:
        None. Losses are logged through a tensorboard SummaryWriter.
    '''

    criterion = nn.MSELoss(reduction='mean') # Define your loss function, do not modify this.

    # Define your optimization algorithm. 
    # TODO: Please check https://pytorch.org/docs/stable/optim.html to get more available algorithms.
    # TODO: L2 regularization (optimizer(weight decay...) or implement by your self).
    optimizer = torch.optim.Adam(model.parameters(), lr=config['learning_rate']) 
    # optimizer = torch.optim.SGD(model.parameters(), lr=config['learning_rate'], momentum=0.9) 

    # Create the directory the checkpoint is written to. It is derived from
    # config['save_path'] so that a custom path works as well, and
    # exist_ok avoids a check-then-create race.
    save_dir = os.path.dirname(config['save_path'])
    if save_dir:
        os.makedirs(save_dir, exist_ok=True)

    n_epochs, best_loss, step, early_stop_count = config['n_epochs'], math.inf, 0, 0

    writer = SummaryWriter() # Writer of tensorboard.
    try:
        for epoch in range(n_epochs):
            model.train() # Set your model to train mode.
            loss_record = []

            # tqdm is a package to visualize your training progress.
            train_pbar = tqdm(train_loader, position=0, leave=True)
            for x, y in train_pbar:
                optimizer.zero_grad()               # Set gradient to zero.
                x, y = x.to(device), y.to(device)   # Move your data to device.
                pred = model(x)
                loss = criterion(pred, y)
                loss.backward()                     # Compute gradient(backpropagation).
                optimizer.step()                    # Update parameters.
                step += 1
                loss_record.append(loss.item())

                # Display current epoch number and loss on tqdm progress bar.
                # train_pbar.set_description(f'Epoch [{epoch+1}/{n_epochs}]')
                # train_pbar.set_postfix({'loss': loss.detach().item()})

            # Mean of the per-batch training losses for this epoch.
            mean_train_loss = sum(loss_record)/len(loss_record)
            writer.add_scalar('Loss/train', mean_train_loss, step)

            model.eval() # Set your model to evaluation mode.
            loss_record = []
            for x, y in valid_loader:
                x, y = x.to(device), y.to(device)
                with torch.no_grad():
                    pred = model(x)
                    loss = criterion(pred, y)

                loss_record.append(loss.item())

            mean_valid_loss = sum(loss_record)/len(loss_record)
            # NOTE(review): the validation loss is printed AND logged to
            # tensorboard only every 20 epochs, while the training loss is
            # logged every epoch - confirm the sparser validation curve is intended.
            if epoch % 20 == 0:
                print(f'Epoch [{epoch+1}/{n_epochs}]: Train loss: {mean_train_loss:.4f}, Valid loss: {mean_valid_loss:.4f}')
                writer.add_scalar('Loss/valid', mean_valid_loss, step)

            if mean_valid_loss < best_loss:
                best_loss = mean_valid_loss
                torch.save(model.state_dict(), config['save_path']) # Save your best model
                print('Saving model with loss {:.3f}...'.format(best_loss))
                early_stop_count = 0
            else: 
                early_stop_count += 1

            if early_stop_count >= config['early_stop']:
                print('\nModel is not improving, so we halt the training session.')
                return
    finally:
        # Close the writer on every exit path (normal end, early stop, or an
        # exception) so it is not left open.
        writer.close()

# Configurations
`config` contains hyper-parameters for training and the path to save your model.

In [8]:
# Use the GPU when PyTorch can see one, otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = 'cuda'
else:
    device = 'cpu'

# Hyper-parameters for training and the path the best model is saved to.
config = dict(
    seed=5211314,                     # Your seed number, you can pick your lucky number. :)
    select_all=False,                 # Whether to use all features.
    valid_ratio=0.2,                  # Fraction of the loaded training data held out for validation.
    n_epochs=6000,                    # Number of epochs.
    batch_size=128,
    learning_rate=1e-5,
    early_stop=400,                   # Stop after this many consecutive epochs without improvement.
    save_path='./models/model.ckpt',  # Your model will be saved here.
)

# Dataloader
Read data from files and set up training, validation, and testing sets. You do not need to modify this part.

In [9]:
# Fix all random seeds first so the split and the shuffling are reproducible.
same_seed(config['seed'])

# Load the raw CSV files as NumPy arrays.
# train_data size: 2699 x 118 (id + 37 states + 16 features x 5 days)
# test_data size: 1078 x 117 (without last day's positive rate)
train_data = pd.read_csv('./covid.train.csv').values
test_data = pd.read_csv('./covid.test.csv').values

# Hold out part of the training data for validation.
train_data, valid_data = train_valid_split(train_data, config['valid_ratio'], config['seed'])

# Report the size of each split.
print(f"train_data size: {train_data.shape} \nvalid_data size: {valid_data.shape} \ntest_data size: {test_data.shape}")

# Keep only the chosen feature columns and separate the targets.
x_train, x_valid, x_test, y_train, y_valid = select_feat(
    train_data, valid_data, test_data, config['select_all'])

# Report how many features the model will receive.
print(f'number of features: {x_train.shape[1]}')

# Wrap the arrays as datasets; the test set has no targets.
train_dataset = COVID19Dataset(x_train, y_train)
valid_dataset = COVID19Dataset(x_valid, y_valid)
test_dataset = COVID19Dataset(x_test)

# Batch the datasets. The test loader is not shuffled.
train_loader = DataLoader(
    train_dataset, batch_size=config['batch_size'], shuffle=True, pin_memory=True)
# NOTE(review): the validation loader is shuffled as well; presumably not
# required for evaluation - left as is to keep results unchanged.
valid_loader = DataLoader(
    valid_dataset, batch_size=config['batch_size'], shuffle=True, pin_memory=True)
test_loader = DataLoader(
    test_dataset, batch_size=config['batch_size'], shuffle=False, pin_memory=True)

train_data size: (2160, 118) 
valid_data size: (539, 118) 
test_data size: (1078, 117)
number of features: 66


# Start training!

In [None]:
# Build the network with one input per selected feature, then put your model
# and data on the same computation device before training.
model = My_Model(input_dim=x_train.shape[1])
model = model.to(device)
trainer(train_loader, valid_loader, model, config, device)

100%|██████████| 17/17 [00:01<00:00, 12.43it/s]


Epoch [1/6000]: Train loss: 157.0271, Valid loss: 164.6660
Saving model with loss 164.666...


100%|██████████| 17/17 [00:00<00:00, 682.13it/s]


Saving model with loss 157.856...


100%|██████████| 17/17 [00:00<00:00, 682.30it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]


Saving model with loss 150.464...


100%|██████████| 17/17 [00:00<00:00, 668.70it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.64it/s]


Saving model with loss 142.408...


100%|██████████| 17/17 [00:00<00:00, 730.07it/s]
100%|██████████| 17/17 [00:00<00:00, 775.34it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 741.62it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.56it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 140.448...


100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]


Epoch [21/6000]: Train loss: 145.4581, Valid loss: 145.7254


100%|██████████| 17/17 [00:00<00:00, 722.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]


Saving model with loss 137.087...


100%|██████████| 17/17 [00:00<00:00, 741.58it/s]
100%|██████████| 17/17 [00:00<00:00, 741.58it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.67it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]


Saving model with loss 133.564...


100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.68it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 775.34it/s]


Saving model with loss 133.105...


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]


Epoch [41/6000]: Train loss: 136.0885, Valid loss: 135.2835


100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Saving model with loss 131.598...


100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Saving model with loss 126.092...


100%|██████████| 17/17 [00:00<00:00, 741.48it/s]


Saving model with loss 125.731...


100%|██████████| 17/17 [00:00<00:00, 741.58it/s]
100%|██████████| 17/17 [00:00<00:00, 741.62it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 812.23it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 122.259...


100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 710.53it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]


Epoch [61/6000]: Train loss: 127.3346, Valid loss: 126.1981


100%|██████████| 17/17 [00:00<00:00, 775.33it/s]


Saving model with loss 117.528...


100%|██████████| 17/17 [00:00<00:00, 741.62it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 778.62it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 812.25it/s]
100%|██████████| 17/17 [00:00<00:00, 812.24it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 741.63it/s]


Saving model with loss 115.508...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 812.24it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 812.23it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.62it/s]
100%|██████████| 17/17 [00:00<00:00, 775.33it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]


Epoch [81/6000]: Train loss: 118.9196, Valid loss: 110.2030
Saving model with loss 110.203...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Saving model with loss 107.134...


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 775.33it/s]


Saving model with loss 106.398...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Epoch [101/6000]: Train loss: 109.8928, Valid loss: 114.7801


100%|██████████| 17/17 [00:00<00:00, 741.59it/s]


Saving model with loss 103.726...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.22it/s]


Saving model with loss 102.643...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Saving model with loss 102.550...


100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 741.54it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.14it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 98.056...


100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 812.23it/s]


Saving model with loss 95.371...


100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 775.32it/s]
100%|██████████| 17/17 [00:00<00:00, 722.94it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]


Epoch [121/6000]: Train loss: 101.0596, Valid loss: 102.1553


100%|██████████| 17/17 [00:00<00:00, 741.63it/s]
100%|██████████| 17/17 [00:00<00:00, 775.25it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.54it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Saving model with loss 94.863...


100%|██████████| 17/17 [00:00<00:00, 668.75it/s]


Saving model with loss 90.310...


100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 725.67it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 656.14it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 89.213...


100%|██████████| 17/17 [00:00<00:00, 696.03it/s]


Saving model with loss 88.666...


100%|██████████| 17/17 [00:00<00:00, 775.32it/s]


Epoch [141/6000]: Train loss: 91.8118, Valid loss: 89.0745


100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 350.44it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]


Saving model with loss 86.412...


100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]


Saving model with loss 85.669...


100%|██████████| 17/17 [00:00<00:00, 328.01it/s]


Saving model with loss 85.172...


100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]


Saving model with loss 82.693...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 325.15it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 318.77it/s]
100%|██████████| 17/17 [00:00<00:00, 268.58it/s]


Epoch [161/6000]: Train loss: 82.4923, Valid loss: 75.7788
Saving model with loss 75.779...


100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 297.24it/s]
100%|██████████| 17/17 [00:00<00:00, 270.71it/s]
100%|██████████| 17/17 [00:00<00:00, 294.09it/s]
100%|██████████| 17/17 [00:00<00:00, 270.73it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 294.07it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 72.598...


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 291.74it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]


Saving model with loss 72.528...


100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 70.073...


100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Epoch [181/6000]: Train loss: 73.0448, Valid loss: 74.6246


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 69.063...


100%|██████████| 17/17 [00:00<00:00, 281.15it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]


Saving model with loss 66.336...


100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 291.32it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 289.07it/s]


Saving model with loss 65.391...


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 304.58it/s]
100%|██████████| 17/17 [00:00<00:00, 306.65it/s]
100%|██████████| 17/17 [00:00<00:00, 299.22it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 268.57it/s]


Saving model with loss 63.818...


100%|██████████| 17/17 [00:00<00:00, 296.59it/s]
100%|██████████| 17/17 [00:00<00:00, 301.86it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]


Epoch [201/6000]: Train loss: 63.8139, Valid loss: 65.3283


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]


Saving model with loss 61.305...


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 61.080...


100%|██████████| 17/17 [00:00<00:00, 288.82it/s]
100%|██████████| 17/17 [00:00<00:00, 285.02it/s]


Saving model with loss 58.714...


100%|██████████| 17/17 [00:00<00:00, 282.15it/s]
100%|██████████| 17/17 [00:00<00:00, 260.17it/s]
100%|██████████| 17/17 [00:00<00:00, 234.75it/s]
100%|██████████| 17/17 [00:00<00:00, 286.59it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Saving model with loss 55.042...


100%|██████████| 17/17 [00:00<00:00, 268.52it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 284.42it/s]
100%|██████████| 17/17 [00:00<00:00, 288.81it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 270.72it/s]


Saving model with loss 54.713...


100%|██████████| 17/17 [00:00<00:00, 266.27it/s]
100%|██████████| 17/17 [00:00<00:00, 275.87it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Epoch [221/6000]: Train loss: 55.2768, Valid loss: 53.2118
Saving model with loss 53.212...


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 250.83it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 281.88it/s]
100%|██████████| 17/17 [00:00<00:00, 296.60it/s]


Saving model with loss 52.112...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]


Saving model with loss 50.930...


100%|██████████| 17/17 [00:00<00:00, 199.47it/s]
100%|██████████| 17/17 [00:00<00:00, 243.67it/s]


Saving model with loss 47.959...


100%|██████████| 17/17 [00:00<00:00, 279.61it/s]
100%|██████████| 17/17 [00:00<00:00, 247.17it/s]


Saving model with loss 47.536...


100%|██████████| 17/17 [00:00<00:00, 250.84it/s]
100%|██████████| 17/17 [00:00<00:00, 270.75it/s]
100%|██████████| 17/17 [00:00<00:00, 247.10it/s]


Saving model with loss 47.355...


100%|██████████| 17/17 [00:00<00:00, 289.20it/s]
100%|██████████| 17/17 [00:00<00:00, 200.77it/s]
100%|██████████| 17/17 [00:00<00:00, 236.90it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 45.686...


100%|██████████| 17/17 [00:00<00:00, 277.91it/s]


Saving model with loss 45.509...


100%|██████████| 17/17 [00:00<00:00, 294.09it/s]


Epoch [241/6000]: Train loss: 47.3879, Valid loss: 47.7937


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 44.707...


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 304.58it/s]
100%|██████████| 17/17 [00:00<00:00, 299.08it/s]
100%|██████████| 17/17 [00:00<00:00, 296.60it/s]


Saving model with loss 43.892...


100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Saving model with loss 42.585...


100%|██████████| 17/17 [00:00<00:00, 230.49it/s]
100%|██████████| 17/17 [00:00<00:00, 208.01it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]


Saving model with loss 42.491...


100%|██████████| 17/17 [00:00<00:00, 286.99it/s]
100%|██████████| 17/17 [00:00<00:00, 295.77it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 294.07it/s]
100%|██████████| 17/17 [00:00<00:00, 299.20it/s]


Saving model with loss 41.721...


100%|██████████| 17/17 [00:00<00:00, 301.67it/s]


Saving model with loss 39.927...


100%|██████████| 17/17 [00:00<00:00, 294.24it/s]
100%|██████████| 17/17 [00:00<00:00, 291.53it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 38.939...


100%|██████████| 17/17 [00:00<00:00, 296.59it/s]


Epoch [261/6000]: Train loss: 40.4609, Valid loss: 43.2580


100%|██████████| 17/17 [00:00<00:00, 291.53it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 38.005...


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 37.049...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]


Saving model with loss 36.967...


100%|██████████| 17/17 [00:00<00:00, 304.04it/s]


Saving model with loss 33.876...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 304.13it/s]
100%|██████████| 17/17 [00:00<00:00, 294.45it/s]
100%|██████████| 17/17 [00:00<00:00, 301.94it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 31.769...


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 295.69it/s]
100%|██████████| 17/17 [00:00<00:00, 312.93it/s]


Epoch [281/6000]: Train loss: 34.6023, Valid loss: 32.5212


100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 315.84it/s]
100%|██████████| 17/17 [00:00<00:00, 290.83it/s]
100%|██████████| 17/17 [00:00<00:00, 286.37it/s]


Saving model with loss 31.635...


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 31.268...


100%|██████████| 17/17 [00:00<00:00, 277.02it/s]
100%|██████████| 17/17 [00:00<00:00, 282.24it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Saving model with loss 29.912...


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 266.49it/s]
100%|██████████| 17/17 [00:00<00:00, 294.06it/s]


Saving model with loss 29.691...


100%|██████████| 17/17 [00:00<00:00, 295.16it/s]
100%|██████████| 17/17 [00:00<00:00, 296.59it/s]
100%|██████████| 17/17 [00:00<00:00, 272.87it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Saving model with loss 27.653...


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]


Epoch [301/6000]: Train loss: 29.5351, Valid loss: 29.9373


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 290.18it/s]
100%|██████████| 17/17 [00:00<00:00, 265.49it/s]


Saving model with loss 27.141...


100%|██████████| 17/17 [00:00<00:00, 258.43it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 270.62it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]


Saving model with loss 26.529...


100%|██████████| 17/17 [00:00<00:00, 279.34it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 285.57it/s]
100%|██████████| 17/17 [00:00<00:00, 279.60it/s]


Saving model with loss 25.852...


100%|██████████| 17/17 [00:00<00:00, 279.61it/s]
100%|██████████| 17/17 [00:00<00:00, 290.74it/s]
100%|██████████| 17/17 [00:00<00:00, 281.71it/s]


Saving model with loss 25.018...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]


Saving model with loss 24.952...


100%|██████████| 17/17 [00:00<00:00, 270.61it/s]


Epoch [321/6000]: Train loss: 25.4702, Valid loss: 25.3327


100%|██████████| 17/17 [00:00<00:00, 281.89it/s]
100%|██████████| 17/17 [00:00<00:00, 291.81it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 291.52it/s]


Saving model with loss 24.077...


100%|██████████| 17/17 [00:00<00:00, 286.64it/s]


Saving model with loss 22.990...


100%|██████████| 17/17 [00:00<00:00, 275.86it/s]
100%|██████████| 17/17 [00:00<00:00, 286.62it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Saving model with loss 22.103...


100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]


Saving model with loss 19.796...


100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Epoch [341/6000]: Train loss: 22.1340, Valid loss: 22.7254


100%|██████████| 17/17 [00:00<00:00, 283.27it/s]
100%|██████████| 17/17 [00:00<00:00, 277.26it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 255.15it/s]
100%|██████████| 17/17 [00:00<00:00, 91.52it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 315.29it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]


Saving model with loss 19.034...


100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 325.99it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 330.70it/s]
100%|██████████| 17/17 [00:00<00:00, 327.51it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 331.15it/s]


Saving model with loss 19.021...


100%|██████████| 17/17 [00:00<00:00, 328.01it/s]


Saving model with loss 18.858...


100%|██████████| 17/17 [00:00<00:00, 327.20it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 328.01it/s]


Epoch [361/6000]: Train loss: 19.4789, Valid loss: 18.8114
Saving model with loss 18.811...


100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 328.01it/s]
100%|██████████| 17/17 [00:00<00:00, 328.01it/s]


Saving model with loss 18.250...


100%|██████████| 17/17 [00:00<00:00, 328.01it/s]


Saving model with loss 18.130...


100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 328.01it/s]
100%|██████████| 17/17 [00:00<00:00, 328.01it/s]

Saving model with loss 17.185...



100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 323.64it/s]
100%|██████████| 17/17 [00:00<00:00, 330.59it/s]
100%|██████████| 17/17 [00:00<00:00, 328.00it/s]


Saving model with loss 16.328...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 321.80it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 315.84it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]


Epoch [381/6000]: Train loss: 17.2976, Valid loss: 17.1844


100%|██████████| 17/17 [00:00<00:00, 312.88it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 325.24it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]


Saving model with loss 15.742...


100%|██████████| 17/17 [00:00<00:00, 318.77it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]


Saving model with loss 15.693...


100%|██████████| 17/17 [00:00<00:00, 310.13it/s]


Saving model with loss 15.384...


100%|██████████| 17/17 [00:00<00:00, 315.86it/s]


Saving model with loss 14.836...


100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 321.80it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]


Epoch [401/6000]: Train loss: 15.6781, Valid loss: 14.8062
Saving model with loss 14.806...


100%|██████████| 17/17 [00:00<00:00, 286.63it/s]
100%|██████████| 17/17 [00:00<00:00, 286.64it/s]


Saving model with loss 14.126...


100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 289.17it/s]
100%|██████████| 17/17 [00:00<00:00, 280.24it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 299.22it/s]
100%|██████████| 17/17 [00:00<00:00, 272.88it/s]
100%|██████████| 17/17 [00:00<00:00, 270.73it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 301.84it/s]
100%|██████████| 17/17 [00:00<00:00, 304.58it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 307.28it/s]


Saving model with loss 13.683...


100%|██████████| 17/17 [00:00<00:00, 282.67it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Epoch [421/6000]: Train loss: 14.2827, Valid loss: 13.9244


100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 296.27it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]


Saving model with loss 13.337...


100%|██████████| 17/17 [00:00<00:00, 250.84it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]


Saving model with loss 12.884...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]


Saving model with loss 12.707...


100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 285.22it/s]


Saving model with loss 12.644...


100%|██████████| 17/17 [00:00<00:00, 266.50it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 301.32it/s]


Saving model with loss 12.358...


100%|██████████| 17/17 [00:00<00:00, 270.75it/s]


Saving model with loss 12.351...


100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 304.58it/s]


Epoch [441/6000]: Train loss: 12.9913, Valid loss: 12.2609
Saving model with loss 12.261...


100%|██████████| 17/17 [00:00<00:00, 273.38it/s]
100%|██████████| 17/17 [00:00<00:00, 284.26it/s]
100%|██████████| 17/17 [00:00<00:00, 275.76it/s]
100%|██████████| 17/17 [00:00<00:00, 277.31it/s]
100%|██████████| 17/17 [00:00<00:00, 268.88it/s]


Saving model with loss 12.020...


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]


Saving model with loss 11.446...


100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 224.43it/s]
100%|██████████| 17/17 [00:00<00:00, 215.91it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 268.05it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 262.42it/s]


Saving model with loss 10.614...


100%|██████████| 17/17 [00:00<00:00, 240.23it/s]
100%|██████████| 17/17 [00:00<00:00, 277.31it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]


Epoch [461/6000]: Train loss: 11.7996, Valid loss: 10.8550


100%|██████████| 17/17 [00:00<00:00, 262.40it/s]
100%|██████████| 17/17 [00:00<00:00, 275.12it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 250.81it/s]
100%|██████████| 17/17 [00:00<00:00, 272.65it/s]
100%|██████████| 17/17 [00:00<00:00, 264.41it/s]


Saving model with loss 10.600...


100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 281.89it/s]
100%|██████████| 17/17 [00:00<00:00, 259.07it/s]
100%|██████████| 17/17 [00:00<00:00, 263.77it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 279.10it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]


Saving model with loss 10.471...


100%|██████████| 17/17 [00:00<00:00, 275.10it/s]
100%|██████████| 17/17 [00:00<00:00, 290.54it/s]


Saving model with loss 10.129...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 268.33it/s]


Saving model with loss 10.123...


100%|██████████| 17/17 [00:00<00:00, 267.37it/s]


Epoch [481/6000]: Train loss: 10.7106, Valid loss: 10.4369


100%|██████████| 17/17 [00:00<00:00, 280.75it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 9.764...


100%|██████████| 17/17 [00:00<00:00, 285.18it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 265.43it/s]
100%|██████████| 17/17 [00:00<00:00, 272.54it/s]
100%|██████████| 17/17 [00:00<00:00, 247.73it/s]


Saving model with loss 9.661...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 278.23it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 271.07it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Saving model with loss 9.363...


100%|██████████| 17/17 [00:00<00:00, 273.29it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 250.83it/s]


Saving model with loss 8.926...


100%|██████████| 17/17 [00:00<00:00, 205.50it/s]
100%|██████████| 17/17 [00:00<00:00, 222.23it/s]


Epoch [501/6000]: Train loss: 9.7555, Valid loss: 9.6164


100%|██████████| 17/17 [00:00<00:00, 263.60it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]


Saving model with loss 8.762...


100%|██████████| 17/17 [00:00<00:00, 253.05it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 266.49it/s]
100%|██████████| 17/17 [00:00<00:00, 266.52it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 293.98it/s]
100%|██████████| 17/17 [00:00<00:00, 270.75it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 8.447...


100%|██████████| 17/17 [00:00<00:00, 268.30it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 271.67it/s]
100%|██████████| 17/17 [00:00<00:00, 266.24it/s]


Epoch [521/6000]: Train loss: 8.8715, Valid loss: 8.2508
Saving model with loss 8.251...


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Saving model with loss 8.247...


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 275.10it/s]
100%|██████████| 17/17 [00:00<00:00, 262.91it/s]
100%|██████████| 17/17 [00:00<00:00, 274.36it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 270.75it/s]
100%|██████████| 17/17 [00:00<00:00, 270.73it/s]


Saving model with loss 7.862...


100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 268.58it/s]
100%|██████████| 17/17 [00:00<00:00, 277.30it/s]
100%|██████████| 17/17 [00:00<00:00, 284.27it/s]
100%|██████████| 17/17 [00:00<00:00, 272.88it/s]
100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 276.30it/s]


Saving model with loss 7.775...


100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 284.29it/s]
100%|██████████| 17/17 [00:00<00:00, 275.10it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]


Epoch [541/6000]: Train loss: 8.1198, Valid loss: 8.7341


100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 7.724...


100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]


Saving model with loss 7.197...


100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 279.63it/s]
100%|██████████| 17/17 [00:00<00:00, 290.61it/s]
100%|██████████| 17/17 [00:00<00:00, 279.03it/s]
100%|██████████| 17/17 [00:00<00:00, 279.61it/s]


Saving model with loss 7.111...


100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 262.39it/s]
100%|██████████| 17/17 [00:00<00:00, 211.86it/s]
100%|██████████| 17/17 [00:00<00:00, 176.74it/s]
100%|██████████| 17/17 [00:00<00:00, 199.48it/s]


Epoch [561/6000]: Train loss: 7.5152, Valid loss: 7.3701


100%|██████████| 17/17 [00:00<00:00, 204.25it/s]
100%|██████████| 17/17 [00:00<00:00, 220.07it/s]
100%|██████████| 17/17 [00:00<00:00, 215.91it/s]


Saving model with loss 7.098...


100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 310.88it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 319.78it/s]


Saving model with loss 7.051...


100%|██████████| 17/17 [00:00<00:00, 316.37it/s]
100%|██████████| 17/17 [00:00<00:00, 318.35it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]


Saving model with loss 6.821...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 306.94it/s]
100%|██████████| 17/17 [00:00<00:00, 294.28it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 318.76it/s]


Epoch [581/6000]: Train loss: 7.0067, Valid loss: 6.6147
Saving model with loss 6.615...


100%|██████████| 17/17 [00:00<00:00, 312.58it/s]
100%|██████████| 17/17 [00:00<00:00, 319.99it/s]
100%|██████████| 17/17 [00:00<00:00, 315.84it/s]


Saving model with loss 6.292...


100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 324.67it/s]
100%|██████████| 17/17 [00:00<00:00, 328.02it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 321.82it/s]
100%|██████████| 17/17 [00:00<00:00, 321.83it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 318.77it/s]
100%|██████████| 17/17 [00:00<00:00, 306.63it/s]
100%|██████████| 17/17 [00:00<00:00, 307.13it/s]
100%|██████████| 17/17 [00:00<00:00, 289.11it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 298.42it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 308.64it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]


Epoch [601/6000]: Train loss: 6.6237, Valid loss: 6.5145


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 448.81it/s]
100%|██████████| 17/17 [00:00<00:00, 416.01it/s]


Saving model with loss 6.240...


100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]


Saving model with loss 6.171...


100%|██████████| 17/17 [00:00<00:00, 473.80it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 416.02it/s]
100%|██████████| 17/17 [00:00<00:00, 370.79it/s]
100%|██████████| 17/17 [00:00<00:00, 568.54it/s]
100%|██████████| 17/17 [00:00<00:00, 550.22it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]


Saving model with loss 6.163...


100%|██████████| 17/17 [00:00<00:00, 550.21it/s]
100%|██████████| 17/17 [00:00<00:00, 410.93it/s]


Saving model with loss 6.047...


100%|██████████| 17/17 [00:00<00:00, 262.41it/s]


Saving model with loss 6.000...


100%|██████████| 17/17 [00:00<00:00, 240.24it/s]
100%|██████████| 17/17 [00:00<00:00, 243.67it/s]
100%|██████████| 17/17 [00:00<00:00, 291.53it/s]


Epoch [621/6000]: Train loss: 6.3618, Valid loss: 6.2303


100%|██████████| 17/17 [00:00<00:00, 243.52it/s]


Saving model with loss 5.968...


100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 473.80it/s]
100%|██████████| 17/17 [00:00<00:00, 448.82it/s]
100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 421.06it/s]


Saving model with loss 5.891...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 550.21it/s]
100%|██████████| 17/17 [00:00<00:00, 643.50it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]


Saving model with loss 5.881...


100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Saving model with loss 5.608...


100%|██████████| 17/17 [00:00<00:00, 547.04it/s]
100%|██████████| 17/17 [00:00<00:00, 533.03it/s]
100%|██████████| 17/17 [00:00<00:00, 559.02it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 598.31it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 460.99it/s]
100%|██████████| 17/17 [00:00<00:00, 541.34it/s]


Epoch [641/6000]: Train loss: 6.1382, Valid loss: 6.0402


100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 533.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]


Saving model with loss 5.428...


100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 615.01it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Epoch [661/6000]: Train loss: 5.9988, Valid loss: 5.5619


100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 608.44it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 568.57it/s]
100%|██████████| 17/17 [00:00<00:00, 461.01it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 608.20it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]


Epoch [681/6000]: Train loss: 5.8862, Valid loss: 5.7686


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 662.71it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]


Saving model with loss 5.385...


100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 596.54it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 431.73it/s]
100%|██████████| 17/17 [00:00<00:00, 416.02it/s]
100%|██████████| 17/17 [00:00<00:00, 473.80it/s]
100%|██████████| 17/17 [00:00<00:00, 426.42it/s]
100%|██████████| 17/17 [00:00<00:00, 448.86it/s]
100%|██████████| 17/17 [00:00<00:00, 431.71it/s]
100%|██████████| 17/17 [00:00<00:00, 487.34it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Epoch [701/6000]: Train loss: 5.8034, Valid loss: 6.3465


100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 5.230...


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 710.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 741.58it/s]
100%|██████████| 17/17 [00:00<00:00, 656.01it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 741.62it/s]


Epoch [721/6000]: Train loss: 5.6915, Valid loss: 5.7519


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.67it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 710.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 682.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 533.04it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 240.23it/s]
100%|██████████| 17/17 [00:00<00:00, 275.12it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 741.63it/s]
100%|██████████| 17/17 [00:00<00:00, 741.63it/s]


Epoch [741/6000]: Train loss: 5.6072, Valid loss: 5.4449


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.74it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Saving model with loss 5.099...


100%|██████████| 17/17 [00:00<00:00, 706.55it/s]


Saving model with loss 5.004...


100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.58it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 620.07it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 620.00it/s]
100%|██████████| 17/17 [00:00<00:00, 710.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Epoch [761/6000]: Train loss: 5.5334, Valid loss: 5.9607


100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.18it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]


Saving model with loss 4.839...


100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 609.20it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [781/6000]: Train loss: 5.4628, Valid loss: 5.7544


100%|██████████| 17/17 [00:00<00:00, 516.88it/s]
100%|██████████| 17/17 [00:00<00:00, 634.43it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 668.77it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.22it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 631.68it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 568.57it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Epoch [801/6000]: Train loss: 5.3758, Valid loss: 6.2636


100%|██████████| 17/17 [00:00<00:00, 609.12it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.22it/s]
100%|██████████| 17/17 [00:00<00:00, 620.14it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 563.88it/s]
100%|██████████| 17/17 [00:00<00:00, 631.77it/s]
100%|██████████| 17/17 [00:00<00:00, 588.43it/s]
100%|██████████| 17/17 [00:00<00:00, 584.53it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]


Epoch [821/6000]: Train loss: 5.2941, Valid loss: 5.6758


100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 4.828...


100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.01it/s]


Saving model with loss 4.827...


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 582.47it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.07it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Saving model with loss 4.816...


100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]


Epoch [841/6000]: Train loss: 5.2024, Valid loss: 5.4302


100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Saving model with loss 4.809...


100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 563.40it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]


Saving model with loss 4.805...


100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 562.67it/s]


Saving model with loss 4.578...


100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 573.85it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 576.23it/s]
100%|██████████| 17/17 [00:00<00:00, 589.10it/s]


Epoch [861/6000]: Train loss: 5.1226, Valid loss: 4.6890


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 573.94it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 639.49it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.15it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 487.34it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]


Epoch [881/6000]: Train loss: 5.0407, Valid loss: 4.9719


100%|██████████| 17/17 [00:00<00:00, 461.00it/s]
100%|██████████| 17/17 [00:00<00:00, 533.03it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]
100%|██████████| 17/17 [00:00<00:00, 416.02it/s]
100%|██████████| 17/17 [00:00<00:00, 501.67it/s]
100%|██████████| 17/17 [00:00<00:00, 487.34it/s]


Saving model with loss 4.549...


100%|██████████| 17/17 [00:00<00:00, 370.80it/s]
100%|██████████| 17/17 [00:00<00:00, 355.35it/s]
100%|██████████| 17/17 [00:00<00:00, 416.02it/s]
100%|██████████| 17/17 [00:00<00:00, 533.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 221.52it/s]
100%|██████████| 17/17 [00:00<00:00, 461.00it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 215.91it/s]


Epoch [901/6000]: Train loss: 4.9676, Valid loss: 4.9437


100%|██████████| 17/17 [00:00<00:00, 487.35it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]


Saving model with loss 4.529...


100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 628.09it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 588.57it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 605.45it/s]
100%|██████████| 17/17 [00:00<00:00, 609.21it/s]
100%|██████████| 17/17 [00:00<00:00, 426.43it/s]
100%|██████████| 17/17 [00:00<00:00, 340.52it/s]
100%|██████████| 17/17 [00:00<00:00, 516.87it/s]
100%|██████████| 17/17 [00:00<00:00, 590.54it/s]
100%|██████████| 17/17 [00:00<00:00, 655.99it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 631.77it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Epoch [921/6000]: Train loss: 4.8837, Valid loss: 4.9856


100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 723.65it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 672.81it/s]
100%|██████████| 17/17 [00:00<00:00, 745.40it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.06it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 4.506...


100%|██████████| 17/17 [00:00<00:00, 678.07it/s]


Epoch [941/6000]: Train loss: 4.7938, Valid loss: 5.1741


100%|██████████| 17/17 [00:00<00:00, 710.67it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Saving model with loss 4.387...


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 4.382...


100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 488.56it/s]
100%|██████████| 17/17 [00:00<00:00, 495.17it/s]


Epoch [961/6000]: Train loss: 4.7172, Valid loss: 4.4524


100%|██████████| 17/17 [00:00<00:00, 386.54it/s]
100%|██████████| 17/17 [00:00<00:00, 487.34it/s]
100%|██████████| 17/17 [00:00<00:00, 542.67it/s]
100%|██████████| 17/17 [00:00<00:00, 545.50it/s]
100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 533.04it/s]


Saving model with loss 4.263...


100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 596.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 540.14it/s]
100%|██████████| 17/17 [00:00<00:00, 550.22it/s]


Saving model with loss 4.253...


100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 626.16it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]


Epoch [981/6000]: Train loss: 4.6423, Valid loss: 4.3242


100%|██████████| 17/17 [00:00<00:00, 550.22it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 564.77it/s]

Saving model with loss 4.135...



100%|██████████| 17/17 [00:00<00:00, 568.55it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 568.55it/s]
100%|██████████| 17/17 [00:00<00:00, 437.36it/s]


Saving model with loss 4.133...


100%|██████████| 17/17 [00:00<00:00, 569.23it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 681.77it/s]
100%|██████████| 17/17 [00:00<00:00, 379.04it/s]
100%|██████████| 17/17 [00:00<00:00, 387.65it/s]
100%|██████████| 17/17 [00:00<00:00, 406.12it/s]
100%|██████████| 17/17 [00:00<00:00, 473.80it/s]
100%|██████████| 17/17 [00:00<00:00, 531.44it/s]
100%|██████████| 17/17 [00:00<00:00, 550.21it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Epoch [1001/6000]: Train loss: 4.5463, Valid loss: 4.1452


100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 682.25it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Saving model with loss 4.037...


100%|██████████| 17/17 [00:00<00:00, 518.67it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1021/6000]: Train loss: 4.4726, Valid loss: 4.2251


100%|██████████| 17/17 [00:00<00:00, 631.71it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 643.27it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.19it/s]
100%|██████████| 17/17 [00:00<00:00, 567.85it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]


Saving model with loss 3.959...


100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 559.14it/s]
100%|██████████| 17/17 [00:00<00:00, 609.20it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 564.19it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]


Epoch [1041/6000]: Train loss: 4.3841, Valid loss: 4.5605


100%|██████████| 17/17 [00:00<00:00, 507.31it/s]
100%|██████████| 17/17 [00:00<00:00, 550.20it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]


Saving model with loss 3.925...


100%|██████████| 17/17 [00:00<00:00, 487.33it/s]
100%|██████████| 17/17 [00:00<00:00, 568.53it/s]


Saving model with loss 3.910...


100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 533.03it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]


Saving model with loss 3.892...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1061/6000]: Train loss: 4.3030, Valid loss: 3.8639
Saving model with loss 3.864...


100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 533.04it/s]


Saving model with loss 3.723...


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 696.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 643.51it/s]
100%|██████████| 17/17 [00:00<00:00, 682.34it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.22it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 655.98it/s]


Epoch [1081/6000]: Train loss: 4.2281, Valid loss: 4.2226


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 666.00it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 3.668...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.23it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 696.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 643.51it/s]


Epoch [1101/6000]: Train loss: 4.1473, Valid loss: 4.1045


100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 668.77it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 668.68it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 725.67it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 609.12it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 3.627...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1121/6000]: Train loss: 4.0695, Valid loss: 3.8583


100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 643.54it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]


Epoch [1141/6000]: Train loss: 3.9848, Valid loss: 3.6944


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 643.54it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 754.63it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 3.509...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.64it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 588.13it/s]
100%|██████████| 17/17 [00:00<00:00, 631.72it/s]


Epoch [1161/6000]: Train loss: 3.9181, Valid loss: 3.7232


100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 643.52it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.06it/s]
100%|██████████| 17/17 [00:00<00:00, 696.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 620.14it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 665.26it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.22it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.77it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 631.34it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 189.51it/s]


Epoch [1181/6000]: Train loss: 3.8351, Valid loss: 4.6625


100%|██████████| 17/17 [00:00<00:00, 254.39it/s]


Saving model with loss 3.482...


100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 720.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 691.34it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 741.64it/s]
100%|██████████| 17/17 [00:00<00:00, 745.61it/s]


Saving model with loss 3.481...


100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 273.71it/s]


Saving model with loss 3.401...


100%|██████████| 17/17 [00:00<00:00, 460.99it/s]
100%|██████████| 17/17 [00:00<00:00, 516.88it/s]


Epoch [1201/6000]: Train loss: 3.7549, Valid loss: 3.4546


100%|██████████| 17/17 [00:00<00:00, 501.70it/s]
100%|██████████| 17/17 [00:00<00:00, 448.85it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 611.38it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 637.69it/s]


Saving model with loss 3.382...


100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 696.05it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 682.24it/s]
100%|██████████| 17/17 [00:00<00:00, 775.30it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 696.06it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Epoch [1221/6000]: Train loss: 3.6778, Valid loss: 3.4437


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Saving model with loss 3.364...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.51it/s]
100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]


Saving model with loss 3.285...


100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 741.73it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]


Saving model with loss 3.193...


100%|██████████| 17/17 [00:00<00:00, 775.31it/s]
100%|██████████| 17/17 [00:00<00:00, 812.17it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]


Epoch [1241/6000]: Train loss: 3.6026, Valid loss: 3.8644


100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 725.68it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 643.54it/s]
100%|██████████| 17/17 [00:00<00:00, 682.63it/s]
100%|██████████| 17/17 [00:00<00:00, 668.16it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 533.03it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 568.57it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]


Epoch [1261/6000]: Train loss: 3.5274, Valid loss: 3.3153


100%|██████████| 17/17 [00:00<00:00, 568.58it/s]
100%|██████████| 17/17 [00:00<00:00, 516.87it/s]
100%|██████████| 17/17 [00:00<00:00, 550.45it/s]
100%|██████████| 17/17 [00:00<00:00, 550.22it/s]
100%|██████████| 17/17 [00:00<00:00, 550.22it/s]
100%|██████████| 17/17 [00:00<00:00, 568.55it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 550.22it/s]
100%|██████████| 17/17 [00:00<00:00, 533.02it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 568.57it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Saving model with loss 3.058...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1281/6000]: Train loss: 3.4487, Valid loss: 3.4498


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 577.34it/s]
100%|██████████| 17/17 [00:00<00:00, 533.03it/s]
100%|██████████| 17/17 [00:00<00:00, 566.88it/s]
100%|██████████| 17/17 [00:00<00:00, 487.33it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]


Saving model with loss 3.007...


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1301/6000]: Train loss: 3.3741, Valid loss: 3.7675


100%|██████████| 17/17 [00:00<00:00, 631.72it/s]
100%|██████████| 17/17 [00:00<00:00, 650.54it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 656.08it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Saving model with loss 2.978...


100%|██████████| 17/17 [00:00<00:00, 631.73it/s]


Epoch [1321/6000]: Train loss: 3.3021, Valid loss: 3.1981


100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 667.08it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 309.92it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]


Saving model with loss 2.921...


100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Epoch [1341/6000]: Train loss: 3.2379, Valid loss: 3.2502


100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 290.59it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]


Saving model with loss 2.805...


100%|██████████| 17/17 [00:00<00:00, 307.30it/s]


Saving model with loss 2.804...


100%|██████████| 17/17 [00:00<00:00, 318.77it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 312.92it/s]
100%|██████████| 17/17 [00:00<00:00, 297.89it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 310.09it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 306.72it/s]


Epoch [1361/6000]: Train loss: 3.1705, Valid loss: 2.9327


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 304.58it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]


Saving model with loss 2.735...


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 310.11it/s]
100%|██████████| 17/17 [00:00<00:00, 294.09it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 304.22it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 294.06it/s]


Epoch [1381/6000]: Train loss: 3.1090, Valid loss: 2.9696


100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 291.54it/s]
100%|██████████| 17/17 [00:00<00:00, 286.03it/s]
100%|██████████| 17/17 [00:00<00:00, 274.13it/s]
100%|██████████| 17/17 [00:00<00:00, 249.51it/s]
100%|██████████| 17/17 [00:00<00:00, 221.52it/s]
100%|██████████| 17/17 [00:00<00:00, 228.92it/s]
100%|██████████| 17/17 [00:00<00:00, 230.50it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]


Saving model with loss 2.703...


100%|██████████| 17/17 [00:00<00:00, 272.01it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 288.75it/s]
100%|██████████| 17/17 [00:00<00:00, 259.95it/s]
100%|██████████| 17/17 [00:00<00:00, 294.09it/s]
100%|██████████| 17/17 [00:00<00:00, 254.57it/s]
100%|██████████| 17/17 [00:00<00:00, 247.20it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 236.90it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]


Epoch [1401/6000]: Train loss: 3.0417, Valid loss: 3.1520


100%|██████████| 17/17 [00:00<00:00, 243.67it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 266.50it/s]
100%|██████████| 17/17 [00:00<00:00, 284.38it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 240.22it/s]
100%|██████████| 17/17 [00:00<00:00, 242.82it/s]
100%|██████████| 17/17 [00:00<00:00, 233.64it/s]
100%|██████████| 17/17 [00:00<00:00, 236.90it/s]
100%|██████████| 17/17 [00:00<00:00, 293.24it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 277.32it/s]


Saving model with loss 2.664...


100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 268.57it/s]
100%|██████████| 17/17 [00:00<00:00, 291.52it/s]
100%|██████████| 17/17 [00:00<00:00, 292.26it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]


Epoch [1421/6000]: Train loss: 2.9815, Valid loss: 2.5755
Saving model with loss 2.576...


100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 297.69it/s]
100%|██████████| 17/17 [00:00<00:00, 285.40it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 277.49it/s]
100%|██████████| 17/17 [00:00<00:00, 295.15it/s]
100%|██████████| 17/17 [00:00<00:00, 268.51it/s]
100%|██████████| 17/17 [00:00<00:00, 274.08it/s]
100%|██████████| 17/17 [00:00<00:00, 274.38it/s]
100%|██████████| 17/17 [00:00<00:00, 224.43it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 281.38it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 264.02it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]


Epoch [1441/6000]: Train loss: 2.9206, Valid loss: 2.7164


100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 260.38it/s]
100%|██████████| 17/17 [00:00<00:00, 261.82it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 275.09it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 279.60it/s]
100%|██████████| 17/17 [00:00<00:00, 250.84it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 272.87it/s]
100%|██████████| 17/17 [00:00<00:00, 269.94it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 286.58it/s]


Epoch [1461/6000]: Train loss: 2.8655, Valid loss: 2.9606


100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 295.76it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 254.57it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 247.19it/s]


Saving model with loss 2.441...


100%|██████████| 17/17 [00:00<00:00, 233.65it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 260.38it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 277.49it/s]
100%|██████████| 17/17 [00:00<00:00, 247.37it/s]
100%|██████████| 17/17 [00:00<00:00, 247.06it/s]
100%|██████████| 17/17 [00:00<00:00, 250.83it/s]
100%|██████████| 17/17 [00:00<00:00, 266.52it/s]
100%|██████████| 17/17 [00:00<00:00, 272.18it/s]
100%|██████████| 17/17 [00:00<00:00, 262.40it/s]


Epoch [1481/6000]: Train loss: 2.8058, Valid loss: 2.7249


100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 281.63it/s]
100%|██████████| 17/17 [00:00<00:00, 279.81it/s]
100%|██████████| 17/17 [00:00<00:00, 286.79it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 285.81it/s]
100%|██████████| 17/17 [00:00<00:00, 243.67it/s]
100%|██████████| 17/17 [00:00<00:00, 254.58it/s]
100%|██████████| 17/17 [00:00<00:00, 281.53it/s]


Saving model with loss 2.397...


100%|██████████| 17/17 [00:00<00:00, 243.67it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 266.52it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 281.48it/s]
100%|██████████| 17/17 [00:00<00:00, 265.21it/s]
100%|██████████| 17/17 [00:00<00:00, 294.09it/s]
100%|██████████| 17/17 [00:00<00:00, 285.00it/s]
100%|██████████| 17/17 [00:00<00:00, 252.84it/s]


Epoch [1501/6000]: Train loss: 2.7514, Valid loss: 2.7185


100%|██████████| 17/17 [00:00<00:00, 279.78it/s]
100%|██████████| 17/17 [00:00<00:00, 233.66it/s]
100%|██████████| 17/17 [00:00<00:00, 234.45it/s]
100%|██████████| 17/17 [00:00<00:00, 279.33it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]


Saving model with loss 2.371...


100%|██████████| 17/17 [00:00<00:00, 258.02it/s]
100%|██████████| 17/17 [00:00<00:00, 283.53it/s]


Saving model with loss 2.337...


100%|██████████| 17/17 [00:00<00:00, 279.60it/s]
100%|██████████| 17/17 [00:00<00:00, 289.08it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 291.16it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 294.07it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 266.49it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 266.52it/s]
100%|██████████| 17/17 [00:00<00:00, 294.22it/s]
100%|██████████| 17/17 [00:00<00:00, 261.89it/s]


Epoch [1521/6000]: Train loss: 2.6994, Valid loss: 2.4586


100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 277.53it/s]
100%|██████████| 17/17 [00:00<00:00, 270.65it/s]
100%|██████████| 17/17 [00:00<00:00, 247.21it/s]
100%|██████████| 17/17 [00:00<00:00, 235.25it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 268.59it/s]
100%|██████████| 17/17 [00:00<00:00, 270.75it/s]
100%|██████████| 17/17 [00:00<00:00, 279.60it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 284.27it/s]
100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 266.80it/s]
100%|██████████| 17/17 [00:00<00:00, 281.92it/s]


Epoch [1541/6000]: Train loss: 2.6554, Valid loss: 2.5958


100%|██████████| 17/17 [00:00<00:00, 262.42it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 283.13it/s]
100%|██████████| 17/17 [00:00<00:00, 248.98it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 247.20it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 178.90it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 266.51it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 253.51it/s]
100%|██████████| 17/17 [00:00<00:00, 296.41it/s]
100%|██████████| 17/17 [00:00<00:00, 305.00it/s]
100%|██████████| 17/17 [00:00<00:00, 311.80it/s]
100%|██████████| 17/17 [00:00<00:00, 315.84it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 307.29it/s]


Epoch [1561/6000]: Train loss: 2.6104, Valid loss: 2.3559


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 317.93it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 315.88it/s]
100%|██████████| 17/17 [00:00<00:00, 313.64it/s]


Saving model with loss 2.312...


100%|██████████| 17/17 [00:00<00:00, 301.53it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 309.51it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 314.33it/s]
100%|██████████| 17/17 [00:00<00:00, 320.48it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 302.83it/s]
100%|██████████| 17/17 [00:00<00:00, 308.20it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 308.19it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 297.18it/s]


Epoch [1581/6000]: Train loss: 2.5626, Valid loss: 2.5463


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 215.91it/s]
100%|██████████| 17/17 [00:00<00:00, 196.06it/s]
100%|██████████| 17/17 [00:00<00:00, 239.13it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 283.17it/s]
100%|██████████| 17/17 [00:00<00:00, 210.58it/s]


Saving model with loss 2.281...


100%|██████████| 17/17 [00:00<00:00, 294.08it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 203.06it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 219.83it/s]


Saving model with loss 2.263...


100%|██████████| 17/17 [00:00<00:00, 182.05it/s]
100%|██████████| 17/17 [00:00<00:00, 277.31it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 270.74it/s]
100%|██████████| 17/17 [00:00<00:00, 279.60it/s]


Epoch [1601/6000]: Train loss: 2.5242, Valid loss: 2.2006
Saving model with loss 2.201...


100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 310.11it/s]
100%|██████████| 17/17 [00:00<00:00, 306.19it/s]
100%|██████████| 17/17 [00:00<00:00, 315.88it/s]
100%|██████████| 17/17 [00:00<00:00, 312.92it/s]
100%|██████████| 17/17 [00:00<00:00, 306.58it/s]
100%|██████████| 17/17 [00:00<00:00, 284.28it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 310.12it/s]


Saving model with loss 2.168...


100%|██████████| 17/17 [00:00<00:00, 310.12it/s]
100%|██████████| 17/17 [00:00<00:00, 309.45it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 258.44it/s]
100%|██████████| 17/17 [00:00<00:00, 315.86it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 289.10it/s]
100%|██████████| 17/17 [00:00<00:00, 268.34it/s]
100%|██████████| 17/17 [00:00<00:00, 315.87it/s]


Epoch [1621/6000]: Train loss: 2.4848, Valid loss: 2.2959


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 279.62it/s]
100%|██████████| 17/17 [00:00<00:00, 264.43it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 301.48it/s]
100%|██████████| 17/17 [00:00<00:00, 262.97it/s]
100%|██████████| 17/17 [00:00<00:00, 268.58it/s]


Saving model with loss 2.163...


100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 310.09it/s]
100%|██████████| 17/17 [00:00<00:00, 302.17it/s]
100%|██████████| 17/17 [00:00<00:00, 310.13it/s]
100%|██████████| 17/17 [00:00<00:00, 301.97it/s]
100%|██████████| 17/17 [00:00<00:00, 297.63it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 299.25it/s]
100%|██████████| 17/17 [00:00<00:00, 247.20it/s]
100%|██████████| 17/17 [00:00<00:00, 275.11it/s]
100%|██████████| 17/17 [00:00<00:00, 276.85it/s]
100%|██████████| 17/17 [00:00<00:00, 240.30it/s]


Saving model with loss 2.096...


100%|██████████| 17/17 [00:00<00:00, 268.58it/s]


Epoch [1641/6000]: Train loss: 2.4477, Valid loss: 2.3012


100%|██████████| 17/17 [00:00<00:00, 289.09it/s]
100%|██████████| 17/17 [00:00<00:00, 299.24it/s]
100%|██████████| 17/17 [00:00<00:00, 304.59it/s]
100%|██████████| 17/17 [00:00<00:00, 89.21it/s]
100%|██████████| 17/17 [00:00<00:00, 233.35it/s]
100%|██████████| 17/17 [00:00<00:00, 198.84it/s]
100%|██████████| 17/17 [00:00<00:00, 252.02it/s]
100%|██████████| 17/17 [00:00<00:00, 262.41it/s]
100%|██████████| 17/17 [00:00<00:00, 240.23it/s]
100%|██████████| 17/17 [00:00<00:00, 227.42it/s]
100%|██████████| 17/17 [00:00<00:00, 460.99it/s]
100%|██████████| 17/17 [00:00<00:00, 348.10it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 501.68it/s]
100%|██████████| 17/17 [00:00<00:00, 568.58it/s]
100%|██████████| 17/17 [00:00<00:00, 448.87it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 609.11it/s]
100%|██████████| 17/17 [00:00<00:00, 473.80it/s]


Epoch [1661/6000]: Train loss: 2.4158, Valid loss: 2.2059


100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 655.94it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]


Saving model with loss 2.086...


100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 189.52it/s]
100%|██████████| 17/17 [00:00<00:00, 501.70it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 588.18it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 487.37it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 655.34it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]


Epoch [1681/6000]: Train loss: 2.3825, Valid loss: 2.1355


100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 575.68it/s]


Saving model with loss 2.035...


100%|██████████| 17/17 [00:00<00:00, 550.23it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 588.16it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 647.76it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 767.25it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Epoch [1701/6000]: Train loss: 2.3556, Valid loss: 2.1390


100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 539.49it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 695.97it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Saving model with loss 1.998...


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 695.98it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 710.59it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]


Epoch [1721/6000]: Train loss: 2.3299, Valid loss: 2.1283


100%|██████████| 17/17 [00:00<00:00, 682.19it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 741.59it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]


Saving model with loss 1.956...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 692.99it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 741.62it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 677.76it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 609.20it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]


Epoch [1741/6000]: Train loss: 2.3020, Valid loss: 2.1522


100%|██████████| 17/17 [00:00<00:00, 710.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 741.61it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 741.60it/s]


Saving model with loss 1.925...


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]


Epoch [1761/6000]: Train loss: 2.2744, Valid loss: 1.9645


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 710.72it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 710.69it/s]
100%|██████████| 17/17 [00:00<00:00, 710.70it/s]
100%|██████████| 17/17 [00:00<00:00, 693.39it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Saving model with loss 1.866...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.62it/s]
100%|██████████| 17/17 [00:00<00:00, 710.73it/s]
100%|██████████| 17/17 [00:00<00:00, 684.56it/s]


Epoch [1781/6000]: Train loss: 2.2553, Valid loss: 2.2877


100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.18it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 710.59it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 620.08it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 620.09it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 668.75it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Epoch [1801/6000]: Train loss: 2.2290, Valid loss: 1.9677


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 568.56it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 588.17it/s]
100%|██████████| 17/17 [00:00<00:00, 609.20it/s]
100%|██████████| 17/17 [00:00<00:00, 609.18it/s]
100%|██████████| 17/17 [00:00<00:00, 661.73it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 656.07it/s]
100%|██████████| 17/17 [00:00<00:00, 690.83it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]


Epoch [1821/6000]: Train loss: 2.2156, Valid loss: 2.3626


100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 656.05it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 674.46it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 609.15it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 682.26it/s]
100%|██████████| 17/17 [00:00<00:00, 682.16it/s]
100%|██████████| 17/17 [00:00<00:00, 682.35it/s]


Epoch [1841/6000]: Train loss: 2.1962, Valid loss: 2.1226


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 631.64it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 656.07it/s]
100%|██████████| 17/17 [00:00<00:00, 682.31it/s]
100%|██████████| 17/17 [00:00<00:00, 682.18it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.02it/s]


Saving model with loss 1.853...


100%|██████████| 17/17 [00:00<00:00, 655.93it/s]
100%|██████████| 17/17 [00:00<00:00, 609.19it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 696.00it/s]
100%|██████████| 17/17 [00:00<00:00, 631.75it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Saving model with loss 1.853...


100%|██████████| 17/17 [00:00<00:00, 668.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1861/6000]: Train loss: 2.1781, Valid loss: 1.8747


100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 567.84it/s]
100%|██████████| 17/17 [00:00<00:00, 617.04it/s]
100%|██████████| 17/17 [00:00<00:00, 609.16it/s]
100%|██████████| 17/17 [00:00<00:00, 631.76it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]


Saving model with loss 1.827...


100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]


Epoch [1881/6000]: Train loss: 2.1601, Valid loss: 1.8761


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 631.73it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 710.71it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 640.96it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]


Saving model with loss 1.801...


100%|██████████| 17/17 [00:00<00:00, 682.29it/s]
100%|██████████| 17/17 [00:00<00:00, 609.17it/s]


Saving model with loss 1.769...


100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 656.17it/s]


Epoch [1901/6000]: Train loss: 2.1465, Valid loss: 2.1125


100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.22it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 656.01it/s]
100%|██████████| 17/17 [00:00<00:00, 656.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 643.03it/s]
100%|██████████| 17/17 [00:00<00:00, 656.04it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
100%|██████████| 17/17 [00:00<00:00, 682.28it/s]
100%|██████████| 17/17 [00:00<00:00, 656.14it/s]
100%|██████████| 17/17 [00:00<00:00, 631.74it/s]
100%|██████████| 17/17 [00:00<00:00, 682.27it/s]
  0%|          | 0/17 [00:00<?, ?it/s]

# Plot learning curves with `tensorboard` (optional)

`tensorboard` is a tool that allows you to visualize your training progress.

If this block does not display your learning curve, please wait a few minutes and re-run it. It might take some time to load your logging information.

In [None]:
# %reload_ext tensorboard
# %tensorboard --logdir=./runs/

# Testing
The predictions of your model on the testing set will be stored at `pred05041716.csv` (the filename passed to `save_pred` below).

In [None]:
def save_pred(preds, file):
    '''Save predictions to a CSV file.

    Writes the header row ``id,tested_positive`` followed by one row per
    prediction, where ``id`` is the zero-based position of the prediction
    within ``preds``.

    Args:
        preds: Iterable of predicted values.
        file: Path of the CSV file to write (opened in 'w' mode, so any
            existing content is replaced).
    '''
    # newline='' hands line-ending control to the csv module; without it,
    # platforms that translate newlines on write (e.g. Windows) end up with
    # an extra blank line between rows.
    with open(file, 'w', newline='') as fp:
        writer = csv.writer(fp)
        writer.writerow(['id', 'tested_positive'])
        # enumerate yields (index, prediction) pairs, one CSV row each.
        writer.writerows(enumerate(preds))

# Build a fresh network whose input width matches the training features,
# then restore the weights stored at config['save_path'].
model = My_Model(input_dim=x_train.shape[1]).to(device)
# map_location remaps the stored tensors onto the current device, so a
# checkpoint written on a GPU can still be loaded on a CPU-only runtime.
model.load_state_dict(torch.load(config['save_path'], map_location=device))
# Run inference on the test loader and write the predictions to disk.
preds = predict(test_loader, model, device)
save_pred(preds, 'pred05041716.csv')

# Reference
This notebook uses code written by Heng-Jui Chang @ NTUEE (https://github.com/ga642381/ML2021-Spring/blob/main/HW01/HW01.ipynb)