In [1]:
link = 'D:/users/Marko/downloads/mirna/'

# Imports

In [2]:
%load_ext tensorboard

In [3]:
import sys
#sys.path.insert(0,'/content/drive/MyDrive/Marko/master')
sys.path.insert(0, link)
import numpy as np
import matplotlib.pyplot as plt

#import tensorflow as tf

import torch
import torch.optim as optim
import torch.nn as nn
import torch.distributions as dist

from torch.nn import functional as F
from torchinfo import summary
from torch.utils.tensorboard import SummaryWriter
from torch.utils.data import Dataset, DataLoader

from sklearn.preprocessing import OneHotEncoder

from tqdm import tqdm
from tqdm import trange

import datetime


writer = SummaryWriter(f"{link}/saved_models/VAEFC/tensorboard")

In [4]:
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")

In [5]:
DEVICE

device(type='cuda')

# Model Classes

In [6]:
class diva_args:

    def __init__(self, z_dim=64, d_dim=45, x_dim=7500, y_dim=2,
                 beta=10, rec_alpha = 1, rec_beta = 1, 
                 rec_gamma = 1, warmup = 1, prewarmup = 1):

        self.z_dim = z_dim
        self.d_dim = d_dim
        self.x_dim = x_dim
        self.y_dim = y_dim
        
        self.beta = beta
        self.rec_alpha = rec_alpha
        self.rec_beta = rec_beta
        self.rec_gamma = rec_gamma
        self.warmup = warmup
        self.prewarmup = prewarmup


## Dataset Class

In [7]:
class MicroRNADataset(Dataset):

    def __init__(self, ds='train', create_encodings=False, use_subset=False):
        
        # loading images
        self.images = np.load(f'{link}/data/modmirbase_{ds}_images.npz')['arr_0']/255
        
        
        # loading labels
        print('Loading Labels! (~10s)')     
        ohe = OneHotEncoder(categories='auto', sparse=False)
        labels = np.load(f'{link}/data/modmirbase_{ds}_labels.npz')['arr_0']
        self.labels = ohe.fit_transform(labels)
        
        # loading encoded images
        print("loading encodings")
        if create_encodings:
            x_len, x_col, x_bar = self.get_encoded_values(self.images, ds)
        else:
            x_len = np.load(f'{link}/data/modmirbase_{ds}_images_len2.npz')
            x_bar = np.load(f'{link}/data/modmirbase_{ds}_images_bar2.npz')
            x_col = np.load(f'{link}/data/modmirbase_{ds}_images_col2.npz')
        
        self.x_len = x_len
        self.x_bar = x_bar
        self.x_col = x_col
        

        # loading names
        print('Loading Names! (~5s)')
        names =  np.load(f'{link}/data/modmirbase_{ds}_names.npz')['arr_0']
        names = [i.decode('utf-8') for i in names]
        self.species = ['mmu', 'prd', 'hsa', 'ptr', 'efu', 'cbn', 'gma', 'pma',
                        'cel', 'gga', 'ipu', 'ptc', 'mdo', 'cgr', 'bta', 'cin', 
                        'ppy', 'ssc', 'ath', 'cfa', 'osa', 'mtr', 'gra', 'mml',
                        'stu', 'bdi', 'rno', 'oan', 'dre', 'aca', 'eca', 'chi',
                        'bmo', 'ggo', 'aly', 'dps', 'mdm', 'ame', 'ppc', 'ssa',
                        'ppt', 'tca', 'dme', 'sbi']
        # assigning a species label to each observation from species
        # with more than 200 observations from past research
        self.names = []
        for i in names:
            append = False
            for j in self.species:
                if j in i.lower():
                    self.names.append(j)
                    append = True
                    break
            if not append:
                if 'random' in i.lower() or i.isdigit():
                    self.names.append('hsa')
                else:
                    self.names.append('notfound')
        
        # performing one hot encoding
        ohe = OneHotEncoder(categories='auto', sparse=False)
        
       
        
        self.names_ohe = ohe.fit_transform(np.array(self.names).reshape(-1,1))
          
        if use_subset:    
            idxes = [i == 'hsa' and np.random.choice([True, False]) for i in self.names]
            self.names_ohe = self.names_ohe[idxes]
            self.labels = self.labels[idxes]
            self.images = self.images[idxes]
            self.x_len = self.x_len[idxes]
            self.x_col = self.x_col[idxes]
            self.x_bar = self.x_bar[idxes]

    
    def __len__(self):
        return(self.images.shape[0])

    def __getitem__(self, idx):
        d = self.names_ohe[idx]
        y = self.labels[idx]
        x = self.images[idx]
        x = np.transpose(x, (2,0,1))
        x_len = self.x_len[idx]
        x_col = self.x_col[idx]
        x_bar = self.x_bar[idx]
        return (x, y, d, x_len, x_col, x_bar)


    def get_encoded_values(self, x, ds):
        """
        given an image or batch of images
        returns length of strand, length of bars and colors of bars
        """
        n = x.shape[0]
        x = np.transpose(x, (0,3,1,2))
        out_len = np.zeros((n), dtype=np.uint8)
        out_col = np.zeros((n,5,200), dtype=np.uint8)
        out_bar = np.zeros((n,2,100), dtype=np.uint8)

        for i in range(n):
            if i % 100 == 0:
                print(f'at {i} out of {n}')
            rna_len = 0
            broke = False
            for j in range(100):
                if (x[i,:,12,j] == np.array([1,1,1])).all():
                    out_len[i] = rna_len
                    broke = True
                    break
                else:
                    rna_len += 1
                    # check color of bars
                    out_col[i, self.get_color(x[i,:,12,j]) ,2*j] = 1 
                    out_col[i, self.get_color(x[i,:,13,j]), 2*j+1] = 1
                    # check length of bars
                    len1 = 0
                    # loop until white pixel
                    while not (x[i,:,12-len1,j] == np.array([1.,1.,1.])).all():
                        len1 += 1
                        if 13-len1 == 0:
                            break
                    out_bar[i, 0, j] = len1

                    len2 = 0
                    while not (x[i,:,13+len2,j] == np.array([1.,1.,1.])).all():
                        len2 += 1
                        if 13+len2 == 25:
                            break
                    out_bar[i, 1, j] = len2
            if not broke:
                out_len[i] = rna_len


        with open(f'{link}/data/modmirbase_{ds}_images_len2.npz', 'wb') as f:
            np.save(f, out_len)
        with open(f'{link}/data/modmirbase_{ds}_images_col2.npz', 'wb') as f:
            np.save(f, out_col)
        with open(f'{link}/data/modmirbase_{ds}_images_bar2.npz', 'wb') as f:
            np.save(f, out_bar)
        

        return out_len, out_bar, out_col

    def get_color(self, pixel):
        """
        returns the encoded value for a pixel
        """
        if (pixel == np.array([0,0,0])).all():  
            return 0 # black
        elif (pixel == np.array([1,0,0])).all():  
            return 1 # red
        elif (pixel == np.array([0,0,1])).all():  
            return 2 # blue
        elif (pixel == np.array([0,1,0])).all():  
            return 3 # green
        elif (pixel == np.array([1,1,0])).all():  
            return 4 # yellow
        else:
            print("Something wrong!")


## Decoder classes

In [8]:
# Decoders
class px(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z_dim, dim1=2000, dim2=1600):
        super(px, self).__init__()

        self.fc1 = nn.Sequential(nn.Linear(z_dim, dim1, bias=False),  
                                 nn.ReLU())
        
        self.fc2 = nn.Sequential(nn.Linear(dim1, dim2, bias=False),  
                                 nn.ReLU())
        
        # Predicting length and color of each bar
        
        # Predicting color of each bar
        self.color_bar_black = nn.Linear(dim2,200)
        self.color_bar_reddd = nn.Linear(dim2,200)
        self.color_bar_bluee = nn.Linear(dim2,200)
        self.color_bar_green = nn.Linear(dim2,200)
        self.color_bar_yelow = nn.Linear(dim2,200)
        
        # Predicting the length of each bar
        self.length_bar_top = nn.Sequential(nn.Linear(dim2,100), nn.Softplus())
        self.length_bar_bot = nn.Sequential(nn.Linear(dim2,100), nn.Softplus())
        #self.length_bar_scale = nn.Sequential(nn.Conv1d(100, 1, kernel_size = 3, padding = 'same', bias=False), nn.Sigmoid())
        
        # Predicting length of the RNA strand
        self.length_RNA = nn.Sequential(nn.Linear(dim2,400), nn.ReLU(),nn.Linear(400,1), nn.Softplus())
        #self.length_RNA_scale = nn.Sequential(nn.Linear(400,1, bias=False), nn.Sigmoid())
        
    def forward(self, z):
        
        h = self.fc1(z)
        h = self.fc2(h)
        
        len_RNA = self.length_RNA(h)
        
        len_RNA_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)
        #len_RNA_sc = torch.exp(self.length_RNA_scale(h))
        
        
        len_bar = torch.cat([self.length_bar_top(h)[:,None,:],self.length_bar_bot(h)[:,None,:]], dim=1) 
        len_bar_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)
        #len_bar_sc = torch.exp(self.length_bar_scale(h))
        
        
        black = self.color_bar_black(h)[:,None,:]
        reddd = self.color_bar_reddd(h)[:,None,:]
        bluee = self.color_bar_bluee(h)[:,None,:]
        green = self.color_bar_green(h)[:,None,:]
        yelow = self.color_bar_yelow(h)[:,None,:]
        
        col = torch.cat([black,reddd,bluee,green,yelow], dim=1)
        
        col_bar = nn.Softmax(dim=1)(col)
        
        return len_RNA, len_RNA_sc, len_bar, len_bar_sc, col_bar

    def reconstruct_image(self, len_RNA, var_RNA, len_bar, var_bar ,col_bar, sample=False):
        """
        reconstructs RNA image given output from decoder
        even indexes of len_bar and col_bar   -> top
        uneven indexes of len_bar and col_bar -> bottom
        function does not support sampling yet
        color reconstructions: 0: black
                               1: red
                               2: blue
                               3: green
                               4: yellow
        """
        color_dict = {
                  0: np.array([0,0,0]), # black
                  1: np.array([1,0,0]), # red
                  3: np.array([0,1,0]), # green
                  2: np.array([0,0,1]), # blue
                  4: np.array([1,1,0])  # yellow
                  }
    
        
        len_RNA = len_RNA.cpu().numpy()
        var_RNA = var_RNA.cpu().numpy()
        #.reshape((100,))
        len_bar = len_bar.cpu().numpy()
        var_bar = var_bar.cpu().numpy()
        col_bar = col_bar.cpu().numpy()
        n = len_RNA.shape[0]
        output = np.ones((n,25,100,3))

        for i in range(n):
            if sample:
                limit = int(np.round(np.random.normal(loc=len_RNA[i], scale=var_RNA[i])))
            else:
                limit = int(np.round(len_RNA[i]))
            limit = min(100, limit)
            for j in range(limit):
                if sample:
                    _len_bar_1 = int(np.round(np.random.normal(loc=len_bar[i,0,j], scale=var_bar[i,0,j])))
                    _len_bar_2 = int(np.round(np.random.normal(loc=len_bar[i,1,j], scale=var_bar[i,1,j])))
                    _col_bar_1 = np.random.choice(np.arange(5), p = col_bar[i, :, 2*j])
                    _col_bar_2 = np.random.choice(np.arange(5), p = col_bar[i,:, 2*j+1])
                else:
                    _len_bar_1 = int(np.round(len_bar[i,0,j])) 
                    _len_bar_2 = int(np.round(len_bar[i,1,j]))
                    _col_bar_1 = np.argmax(col_bar[i,:, 2*j])
                    _col_bar_2 = np.argmax(col_bar[i,:, 2*j+1])
                
                h1 = max(0,13-_len_bar_1)
                # paint upper bar
                output[i, h1:13, j] = color_dict[_col_bar_1]
                h2 = min(25,13+_len_bar_2)
                # paint lower bar
                output[i, 13:h2, j] = color_dict[_col_bar_2]
        
        
        return output


In [9]:
int(np.round(3.7, 0))
int(3.7)

3

In [10]:
# pzy_ = pzy(45, 7500, 2, 32,32,32)
# summary(pzy_, (1,2))
# pzy_ = px(45, 7500, 2, 32,32,32)
# summary(pzy_, [(1,32),(1,32),(1,32)])

## Endcoder Classes

In [11]:
#pzy_.reconstruct_image(torch.zeros((1,100)), torch.zeros((1,13,200)), torch.zeros(1,5,200)).shape

In [12]:
class qz(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z_dim):
        super(qz, self).__init__()

        self.encoder = nn.Sequential(
            nn.Conv2d(3, 64, kernel_size=5, stride=1, padding = 'same',bias=False),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding = 'same', bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
            nn.Conv2d(128, 256, kernel_size=3, stride=1, bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
        )

        self.fc11 = nn.Sequential(nn.Linear(5632, z_dim))
        self.fc12 = nn.Sequential(nn.Linear(5632, z_dim), nn.Softplus())

        torch.nn.init.xavier_uniform_(self.encoder[0].weight)
        torch.nn.init.xavier_uniform_(self.encoder[3].weight)
        torch.nn.init.xavier_uniform_(self.fc11[0].weight)
        self.fc11[0].bias.data.zero_()
        torch.nn.init.xavier_uniform_(self.fc12[0].weight)
        self.fc12[0].bias.data.zero_()

    def forward(self, x):
        h = self.encoder(x)
        h = h.view(-1, 5632)
        z_loc = self.fc11(h)
        z_scale = self.fc12(h) + 1e-7

        return z_loc, z_scale




In [13]:
enc = qz(128,10,10,10)
summary(enc, (1,3,25,100))

Layer (type:depth-idx)                   Output Shape              Param #
qz                                       --                        --
├─Sequential: 1-1                        [1, 256, 2, 11]           --
│    └─Conv2d: 2-1                       [1, 64, 25, 100]          4,800
│    └─ReLU: 2-2                         [1, 64, 25, 100]          --
│    └─MaxPool2d: 2-3                    [1, 64, 12, 50]           --
│    └─Conv2d: 2-4                       [1, 128, 12, 50]          73,728
│    └─ReLU: 2-5                         [1, 128, 12, 50]          --
│    └─MaxPool2d: 2-6                    [1, 128, 6, 25]           --
│    └─Conv2d: 2-7                       [1, 256, 4, 23]           294,912
│    └─ReLU: 2-8                         [1, 256, 4, 23]           --
│    └─MaxPool2d: 2-9                    [1, 256, 2, 11]           --
├─Sequential: 1-2                        [1, 10]                   --
│    └─Linear: 2-10                      [1, 10]                   56,330

## Full model class

In [14]:
class StampDIVA(nn.Module):
    def __init__(self, args):
        super(StampDIVA, self).__init__()
        self.z_dim = args.z_dim
        self.d_dim = args.d_dim
        self.x_dim = args.x_dim
        self.y_dim = args.y_dim

        self.px = px(self.d_dim, self.x_dim, self.y_dim, self.z_dim)
        
        self.qz = qz(self.d_dim, self.x_dim, self.y_dim, self.z_dim)
        

        self.beta = args.beta
        
        self.rec_alpha = args.rec_alpha
        self.rec_beta = args.rec_beta
        self.rec_gamma = args.rec_gamma

        self.warmup = args.warmup
        self.prewarmup = args.prewarmup

        self.cuda()

    def forward(self, d, x, y):
        # Encode
        zd_q_loc, zd_q_scale = self.qz(x)
        
        # Reparameterization trick
        qz = dist.Normal(zd_q_loc, zd_q_scale)
        z_q = qz.rsample()
        
        
        # Decode
        x_len, x_len_scale, x_bar, x_bar_scale, x_col = self.px(z_q)
        z_p_loc, z_p_scale = torch.zeros(z_q.size()[0], self.z_dim).cuda(),\
                        torch.ones(z_q.size()[0], self.z_dim).cuda()
        pz = dist.Normal(z_p_loc, z_p_scale)

        # Reparameterization trick
        pz = dist.Normal(z_p_loc, z_p_scale)
        
        return x_len, x_len_scale, x_bar, x_bar_scale, x_col, qz, pz, z_q

    def loss_function(self, d, x, y, out_len, out_bar, out_col):
        
        x_len, x_len_scale, x_bar, x_bar_scale, x_col, qz, pz, z_q = self.forward(d, x, y)
        mask = 1 - F.one_hot(torch.round(out_len).to(torch.int64)*2-1, 200).cumsum(dim=1)[:,None,:]
        mask1 = (1 - F.one_hot(torch.round(out_len).to(torch.int64)-1, 100).cumsum(dim=1)[:,None,:]).repeat(1,2,1)

        
        #x_bar = mask.repeat(1,1,1)*x_bar
        
        #x_bar_scale = mask.repeat(1,1,1)*x_bar_scale
        x_col = mask.repeat(1,5,1)*x_col
        
        
        dist_len = dist.Normal(x_len, x_len_scale+1e-7)
        log_len = dist_len.log_prob(out_len[:,None]).mean()
        
       # dist_bar = dist.Normal(x_bar, x_bar_scale+1e-7)
        #log_bar = dist_bar.log_prob(out_bar)*mask1
        #log_bar = (log_bar).sum(dim=(1,2)).mean()
        
        mse_bar = ((((x_bar - out_bar)**2)*mask1).sum(dim=(1,2))/(mask1.sum(dim=(1,2)))).sum()#.detach().item()
        
        max_bar = torch.argmax(x_col, dim=1)
        #acc_bar = (((max_bar==out_col)*mask).sum(dim=(1,2))/mask.sum(dim=(1,2))).sum().detach().item()/5
        acc_bar = (max_bar==torch.argmax(out_col, dim=1)).sum().float()
        
        CE_len = -log_len
        CE_bar = mse_bar#-log_bar
        CE_col = F.cross_entropy(x_col, out_col, reduction='sum')

        KL_z = torch.sum(pz.log_prob(z_q) - qz.log_prob(z_q))
          
        return self.rec_alpha * CE_len \
                  + self.rec_beta * CE_bar \
                  + self.rec_gamma * CE_col \
                  - self.beta * KL_z, \
                  CE_bar, CE_len, CE_col, mse_bar, acc_bar

In [15]:
default_args = diva_args(z_dim=1600, rec_alpha = 10, rec_beta = 10, rec_gamma = 10, 
                         beta=1, warmup=1, prewarmup=0)
enc = StampDIVA(default_args)
summary(enc,[ (1,1),(1,3,25,100),(1,1)])

Layer (type:depth-idx)                   Output Shape              Param #
StampDIVA                                --                        --
├─qz: 1-1                                [1, 1600]                 --
│    └─Sequential: 2-1                   [1, 256, 2, 11]           --
│    │    └─Conv2d: 3-1                  [1, 64, 25, 100]          4,800
│    │    └─ReLU: 3-2                    [1, 64, 25, 100]          --
│    │    └─MaxPool2d: 3-3               [1, 64, 12, 50]           --
│    │    └─Conv2d: 3-4                  [1, 128, 12, 50]          73,728
│    │    └─ReLU: 3-5                    [1, 128, 12, 50]          --
│    │    └─MaxPool2d: 3-6               [1, 128, 6, 25]           --
│    │    └─Conv2d: 3-7                  [1, 256, 4, 23]           294,912
│    │    └─ReLU: 3-8                    [1, 256, 4, 23]           --
│    │    └─MaxPool2d: 3-9               [1, 256, 2, 11]           --
│    └─Sequential: 2-2                   [1, 1600]                 --
│  

# Training the model

## Loading dataset

In [16]:
RNA_dataset = MicroRNADataset(create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [17]:
RNA_dataset_test = MicroRNADataset('test', create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [18]:
len(RNA_dataset)

34721

In [19]:
def train_single_epoch(train_loader, model, optimizer, epoch):
    model.train()
    train_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    no_batches = 0
    train_corr = 0
    mse_bar = 0
    acc_bar = 0
    pbar = tqdm(enumerate(train_loader), unit="batch", 
                                     desc=f'Epoch {epoch}')
    for batch_idx, (x, y, d, x_len, x_col, x_bar) in pbar:
        # To device
        x, y, d , x_len, x_bar, x_col = x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE)

        optimizer.zero_grad()
        loss, bar_loss, len_loss, col_loss, mse, acc = model.loss_function(d.float(), x.float(), y.float(), x_len.float(), x_bar.float(), x_col.float())
      
        loss.backward()
        optimizer.step()
        pbar.set_postfix(loss=loss.item()/x.shape[0])
        train_loss += loss
        epoch_bar_loss += bar_loss
        epoch_col_loss += col_loss
        epoch_len_loss += len_loss
        mse_bar += mse
        acc_bar += acc
        no_batches += 1

    train_loss /= len(train_loader.dataset)
    epoch_bar_loss /= len(train_loader.dataset)
    epoch_len_loss /= len(train_loader.dataset)
    epoch_col_loss /= len(train_loader.dataset)
    acc_bar /= len(train_loader.dataset)
    mse_bar /= len(train_loader.dataset)
    
    return train_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar

In [20]:
def test_single_epoch(test_loader, model, epoch):
    model.eval()
    test_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    mse_bar = 0
    acc_bar = 0        
    with torch.no_grad():
        for batch_idx, (x,y,d,x_len,x_col,x_bar) in enumerate(test_loader):
            x, y, d, x_len, x_bar, x_col = x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE)
            loss, bar_loss, len_loss, col_loss, mse, acc = model.loss_function(d.float(), x.float(), y.float(),x_len.float(),x_bar.float(),x_col.float())
            test_loss += loss
            epoch_bar_loss += bar_loss
            epoch_col_loss += col_loss
            epoch_len_loss += len_loss
            mse_bar += mse
            acc_bar += acc
    test_loss /= len(test_loader.dataset)
    epoch_bar_loss /= len(test_loader.dataset)
    epoch_len_loss /= len(test_loader.dataset)
    epoch_col_loss /= len(test_loader.dataset)
    acc_bar /= len(test_loader.dataset)
    mse_bar /= len(test_loader.dataset)
    
    return test_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar
  

In [21]:
def train(args, train_loader, test_loader, diva, optimizer, end_epoch, start_epoch=0, save_folder='sd_1.0.0',save_interval=5):
    
    epoch_loss_sup = []
    test_loss = []
    
    for epoch in range(start_epoch+1, end_epoch+1):
        diva.beta = min([args.beta, args.beta * (epoch - args.prewarmup * 1.) / (args.warmup)])
        if epoch< args.prewarmup:
            diva.beta = args.beta/args.prewarmup
        train_loss, avg_loss_bar, avg_loss_len, avg_loss_col, mtr, atr = train_single_epoch(train_loader, diva, optimizer, epoch)
        str_loss_sup = train_loss
        epoch_loss_sup.append(train_loss)
        str_print = "epoch {}: avg train loss {:.2f}".format(epoch, str_loss_sup)
        str_print += ", bar train loss {:.3f}".format(avg_loss_bar)
        str_print += ", len train loss {:.3f}".format(avg_loss_len)
        str_print += ", col train loss {:.3f}".format(avg_loss_col)
        print(str_print)

        rec_loss_train = diva.rec_alpha * avg_loss_len + diva.rec_beta * avg_loss_bar + diva.rec_gamma * avg_loss_col
        dis_loss_train = train_loss - rec_loss_train

        test_lss, avg_loss_bar_test, avg_loss_len_test, avg_loss_col_test, mte, ate = test_single_epoch(test_loader, diva, epoch)
        test_loss.append(test_lss)
       
        str_print = "epoch {}: avg test  loss {:.2f}".format(epoch, test_lss)
        str_print += ", bar  test loss {:.3f}".format(avg_loss_bar_test)
        str_print += ", len  test loss {:.3f}".format(avg_loss_len_test)
        str_print += ", col  test loss {:.3f}".format(avg_loss_col_test)
        print(str_print)

        rec_loss_test = diva.rec_alpha * avg_loss_len_test + diva.rec_beta * avg_loss_bar_test + diva.rec_gamma * avg_loss_col_test
        dis_loss_test = test_lss - rec_loss_test

        if writer is not None:
            
            writer.add_scalars("Total_Loss", {'train': train_loss, 'test': test_lss} ,epoch)
            writer.add_scalars("Reconstruction_vs_Disentanglement",{'rec':rec_loss_train, 'dis':dis_loss_train}, epoch)
            writer.add_scalars("bar_mse",{'train': mtr, 'test':mte}, epoch)
            writer.add_scalars("bar_acc",{'train': atr, 'test':ate}, epoch)

        if epoch % save_interval == 0:
            save_reconstructions(epoch, test_loader, diva, name=save_folder)
            save_reconstructions(epoch, train_loader, diva, name=save_folder, estr='tr')
        
        
        if epoch % 50 == 0:
            torch.save(diva.state_dict(), f'{link}/saved_models/{save_folder}/checkpoints/{epoch}.pth')

    if writer is not None:
        writer.flush()

    epoch_loss_sup = [i.cpu().detach().numpy() for i in epoch_loss_sup]
    test_loss = [i.cpu().detach().numpy() for i in test_loss]
    return epoch_loss_sup, test_loss

In [22]:
def save_reconstructions(epoch, test_loader, diva, name='diva', estr=''):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:10].to(DEVICE).float()
        x = a[1][0][:10].to(DEVICE).float()
        y = a[1][1][:10].to(DEVICE).float()
        x_1, x_1var, x_2, x_2var, x_3, _, _, _ = diva(d,x,y)
        out = diva.px.reconstruct_image(x_1, x_1var, x_2, x_2var, x_3)

    plt.figure(figsize=(80,20))
    fig, ax = plt.subplots(nrows=10, ncols=2)

    ax[0,0].set_title("Original")
    ax[0,1].set_title("Reconstructed")

    for i in range(10):
        ax[i, 1].imshow(out[i])
        ax[i, 0].imshow(x[i].cpu().permute(1,2,0))
        ax[i, 0].xaxis.set_visible(False)
        ax[i, 0].yaxis.set_visible(False)
        ax[i, 1].xaxis.set_visible(False)
        ax[i, 1].yaxis.set_visible(False)
    fig.tight_layout(pad=0.1)
    plt.savefig(f'{link}/saved_models/{name}/reconstructions/e{epoch}{estr}.png')
    plt.close('all')

In [23]:
DEVICE

device(type='cuda')

## Model Training

In [24]:
default_args = diva_args(z_dim=2048, rec_alpha = 100, rec_beta = 20, rec_gamma = 5, 
                         beta=1, warmup=1, prewarmup=0)

In [25]:
diva = StampDIVA(default_args).to(DEVICE)

In [26]:
#diva.load_state_dict(torch.load(f'{link}/saved_models/VAE10/checkpoints/905.pth'))

In [27]:
train_loader = DataLoader(RNA_dataset, batch_size=128, shuffle=True)
test_loader = DataLoader(RNA_dataset_test, batch_size=128)

In [28]:
#optimizer = optim.SGD(diva.parameters(), lr=0.00001, momentum=0.1, nesterov=True)
optimizer = optim.Adam(diva.parameters(), lr=0.0001)

In [29]:
RNA_dataset.x_len.min(), RNA_dataset.x_len.max()

(10, 100)

In [30]:
writer.flush()

In [31]:
%tensorboard --logdir="D:/users/Marko/downloads/mirna/saved_models/VAEFC/tensorboard/"

Reusing TensorBoard on port 6006 (pid 29544), started 0:31:12 ago. (Use '!kill 29544' to kill it.)

In [None]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 500, 5, save_folder="VAEFC",save_interval=5)

Epoch 6: 272batch [00:18, 14.58batch/s, loss=1.13e+3]


epoch 6: avg train loss 1209.10, bar train loss 12.152, len train loss 0.945, col train loss 169.649
epoch 6: avg test  loss 1079.04, bar  test loss 10.618, len  test loss 0.113, col  test loss 169.453


Epoch 7: 272batch [00:18, 14.69batch/s, loss=1.12e+3]


epoch 7: avg train loss 1069.61, bar train loss 10.121, len train loss 0.103, col train loss 169.476


Epoch 8: 2batch [00:00, 14.71batch/s, loss=1.12e+3]

epoch 7: avg test  loss 1065.86, bar  test loss 9.959, len  test loss 0.096, col  test loss 169.400


Epoch 8: 272batch [00:18, 14.70batch/s, loss=1e+3]   


epoch 8: avg train loss 1054.75, bar train loss 9.345, len train loss 0.095, col train loss 169.306


Epoch 9: 2batch [00:00, 14.81batch/s, loss=1.06e+3]

epoch 8: avg test  loss 1040.62, bar  test loss 8.647, len  test loss 0.087, col  test loss 169.019


Epoch 9: 272batch [00:18, 14.54batch/s, loss=985]    


epoch 9: avg train loss 1031.51, bar train loss 8.260, len train loss 0.091, col train loss 168.458


Epoch 10: 2batch [00:00, 14.81batch/s, loss=1.02e+3]

epoch 9: avg test  loss 1020.98, bar  test loss 7.848, len  test loss 0.091, col  test loss 167.702


Epoch 10: 272batch [00:18, 14.54batch/s, loss=1.04e+3]


epoch 10: avg train loss 1013.57, bar train loss 7.522, len train loss 0.091, col train loss 167.307
epoch 10: avg test  loss 1008.23, bar  test loss 7.223, len  test loss 0.097, col  test loss 167.100


Epoch 11: 272batch [00:18, 14.65batch/s, loss=1.04e+3]


epoch 11: avg train loss 1002.50, bar train loss 6.996, len train loss 0.091, col train loss 166.804


Epoch 12: 2batch [00:00, 13.99batch/s, loss=1.03e+3]

epoch 11: avg test  loss 998.33, bar  test loss 6.836, len  test loss 0.097, col  test loss 166.545


Epoch 12: 272batch [00:18, 14.64batch/s, loss=1.08e+3]


epoch 12: avg train loss 994.69, bar train loss 6.659, len train loss 0.091, col train loss 166.338


Epoch 13: 2batch [00:00, 14.93batch/s, loss=1.02e+3]

epoch 12: avg test  loss 991.96, bar  test loss 6.437, len  test loss 0.111, col  test loss 166.113


Epoch 13: 272batch [00:18, 14.66batch/s, loss=1.09e+3]


epoch 13: avg train loss 986.89, bar train loss 6.309, len train loss 0.090, col train loss 165.890


Epoch 14: 2batch [00:00, 14.93batch/s, loss=995]

epoch 13: avg test  loss 983.25, bar  test loss 6.160, len  test loss 0.087, col  test loss 165.733


Epoch 14: 272batch [00:18, 14.67batch/s, loss=1.06e+3]


epoch 14: avg train loss 980.84, bar train loss 6.057, len train loss 0.089, col train loss 165.445


Epoch 15: 2batch [00:00, 14.49batch/s, loss=983]

epoch 14: avg test  loss 978.62, bar  test loss 5.933, len  test loss 0.089, col  test loss 165.368


Epoch 15: 272batch [00:18, 14.47batch/s, loss=1.08e+3]


epoch 15: avg train loss 975.28, bar train loss 5.813, len train loss 0.090, col train loss 165.043
epoch 15: avg test  loss 972.66, bar  test loss 5.676, len  test loss 0.088, col  test loss 164.917


Epoch 16: 272batch [00:18, 14.48batch/s, loss=1.04e+3]


epoch 16: avg train loss 970.14, bar train loss 5.615, len train loss 0.089, col train loss 164.604


Epoch 17: 2batch [00:00, 14.93batch/s, loss=977]

epoch 16: avg test  loss 967.66, bar  test loss 5.534, len  test loss 0.085, col  test loss 164.506


Epoch 17: 272batch [00:18, 14.67batch/s, loss=987]    


epoch 17: avg train loss 965.63, bar train loss 5.454, len train loss 0.088, col train loss 164.197


Epoch 18: 2batch [00:00, 14.08batch/s, loss=969]

epoch 17: avg test  loss 965.18, bar  test loss 5.380, len  test loss 0.097, col  test loss 164.118


Epoch 18: 272batch [00:18, 14.41batch/s, loss=897]    


epoch 18: avg train loss 961.25, bar train loss 5.301, len train loss 0.087, col train loss 163.798


Epoch 19: 2batch [00:00, 14.81batch/s, loss=927]

epoch 18: avg test  loss 959.54, bar  test loss 5.216, len  test loss 0.086, col  test loss 163.782


Epoch 19: 272batch [00:18, 14.63batch/s, loss=920]    


epoch 19: avg train loss 957.68, bar train loss 5.150, len train loss 0.087, col train loss 163.530


Epoch 20: 2batch [00:00, 14.49batch/s, loss=943]

epoch 19: avg test  loss 957.09, bar  test loss 5.110, len  test loss 0.085, col  test loss 163.639


Epoch 20: 272batch [00:18, 14.60batch/s, loss=951]    


epoch 20: avg train loss 954.87, bar train loss 5.040, len train loss 0.088, col train loss 163.295
epoch 20: avg test  loss 953.82, bar  test loss 4.987, len  test loss 0.088, col  test loss 163.403


Epoch 21: 272batch [00:19, 14.27batch/s, loss=972]    


epoch 21: avg train loss 952.14, bar train loss 4.935, len train loss 0.086, col train loss 163.107


Epoch 22: 2batch [00:00, 14.49batch/s, loss=932]

epoch 21: avg test  loss 954.05, bar  test loss 4.908, len  test loss 0.099, col  test loss 163.323


Epoch 22: 272batch [00:18, 14.62batch/s, loss=952]    


epoch 22: avg train loss 949.54, bar train loss 4.827, len train loss 0.085, col train loss 162.946


Epoch 23: 2batch [00:00, 14.60batch/s, loss=929]

epoch 22: avg test  loss 949.11, bar  test loss 4.741, len  test loss 0.086, col  test loss 163.084


Epoch 23: 272batch [00:18, 14.60batch/s, loss=887]    


epoch 23: avg train loss 947.32, bar train loss 4.733, len train loss 0.084, col train loss 162.803


Epoch 24: 2batch [00:00, 14.71batch/s, loss=964]

epoch 23: avg test  loss 946.62, bar  test loss 4.673, len  test loss 0.084, col  test loss 162.966


Epoch 24: 272batch [00:18, 14.32batch/s, loss=970]    


epoch 24: avg train loss 944.82, bar train loss 4.642, len train loss 0.083, col train loss 162.619


Epoch 25: 2batch [00:00, 14.71batch/s, loss=950]

epoch 24: avg test  loss 946.16, bar  test loss 4.642, len  test loss 0.088, col  test loss 162.861


Epoch 25: 272batch [00:18, 14.55batch/s, loss=924] 


epoch 25: avg train loss 943.24, bar train loss 4.576, len train loss 0.085, col train loss 162.458
epoch 25: avg test  loss 943.28, bar  test loss 4.517, len  test loss 0.082, col  test loss 162.636


Epoch 26: 272batch [00:18, 14.54batch/s, loss=1.01e+3]


epoch 26: avg train loss 941.04, bar train loss 4.504, len train loss 0.082, col train loss 162.264


Epoch 27: 2batch [00:00, 14.71batch/s, loss=957]

epoch 26: avg test  loss 941.54, bar  test loss 4.468, len  test loss 0.082, col  test loss 162.446


Epoch 27: 272batch [00:19, 14.13batch/s, loss=868]   


epoch 27: avg train loss 938.92, bar train loss 4.432, len train loss 0.083, col train loss 162.011


Epoch 28: 2batch [00:00, 14.29batch/s, loss=903]

epoch 27: avg test  loss 940.14, bar  test loss 4.473, len  test loss 0.081, col  test loss 162.270


Epoch 28: 272batch [00:18, 14.52batch/s, loss=948]


epoch 28: avg train loss 937.17, bar train loss 4.380, len train loss 0.081, col train loss 161.843


Epoch 29: 2batch [00:00, 14.49batch/s, loss=973]

epoch 28: avg test  loss 938.17, bar  test loss 4.363, len  test loss 0.089, col  test loss 162.096


Epoch 29: 272batch [00:18, 14.56batch/s, loss=924]    


epoch 29: avg train loss 935.48, bar train loss 4.325, len train loss 0.081, col train loss 161.675


Epoch 30: 2batch [00:00, 14.71batch/s, loss=946]

epoch 29: avg test  loss 936.07, bar  test loss 4.311, len  test loss 0.080, col  test loss 161.908


Epoch 30: 272batch [00:19, 14.25batch/s, loss=974]   


epoch 30: avg train loss 934.08, bar train loss 4.279, len train loss 0.081, col train loss 161.522
epoch 30: avg test  loss 934.22, bar  test loss 4.265, len  test loss 0.078, col  test loss 161.761


Epoch 31: 272batch [00:18, 14.54batch/s, loss=932]   


epoch 31: avg train loss 932.11, bar train loss 4.222, len train loss 0.079, col train loss 161.338


Epoch 32: 2batch [00:00, 14.39batch/s, loss=951]

epoch 31: avg test  loss 934.13, bar  test loss 4.214, len  test loss 0.083, col  test loss 161.623


Epoch 32: 272batch [00:18, 14.55batch/s, loss=994]


epoch 32: avg train loss 931.15, bar train loss 4.179, len train loss 0.080, col train loss 161.221


Epoch 33: 2batch [00:00, 14.29batch/s, loss=945]

epoch 32: avg test  loss 933.05, bar  test loss 4.182, len  test loss 0.086, col  test loss 161.525


Epoch 33: 272batch [00:18, 14.55batch/s, loss=1.03e+3]


epoch 33: avg train loss 929.71, bar train loss 4.143, len train loss 0.079, col train loss 161.045


Epoch 34: 2batch [00:00, 14.71batch/s, loss=920]

epoch 33: avg test  loss 931.51, bar  test loss 4.154, len  test loss 0.079, col  test loss 161.396


Epoch 34: 272batch [00:19, 14.31batch/s, loss=932]   


epoch 34: avg train loss 928.30, bar train loss 4.102, len train loss 0.079, col train loss 160.897


Epoch 35: 2batch [00:00, 14.71batch/s, loss=928]

epoch 34: avg test  loss 930.08, bar  test loss 4.104, len  test loss 0.081, col  test loss 161.261


Epoch 35: 272batch [00:18, 14.55batch/s, loss=942]


epoch 35: avg train loss 926.95, bar train loss 4.065, len train loss 0.077, col train loss 160.761
epoch 35: avg test  loss 928.71, bar  test loss 4.043, len  test loss 0.080, col  test loss 161.150


Epoch 36: 272batch [00:18, 14.53batch/s, loss=1.02e+3]


epoch 36: avg train loss 925.98, bar train loss 4.026, len train loss 0.078, col train loss 160.677


Epoch 37: 2batch [00:00, 14.81batch/s, loss=933]

epoch 36: avg test  loss 928.31, bar  test loss 4.015, len  test loss 0.083, col  test loss 161.071


Epoch 37: 272batch [00:18, 14.56batch/s, loss=927]


epoch 37: avg train loss 924.90, bar train loss 3.995, len train loss 0.076, col train loss 160.578


Epoch 38: 2batch [00:00, 14.71batch/s, loss=938]

epoch 37: avg test  loss 927.12, bar  test loss 4.022, len  test loss 0.076, col  test loss 161.025


Epoch 38: 272batch [00:18, 14.56batch/s, loss=928]


epoch 38: avg train loss 924.32, bar train loss 3.972, len train loss 0.077, col train loss 160.487


Epoch 39: 2batch [00:00, 14.18batch/s, loss=945]

epoch 38: avg test  loss 926.59, bar  test loss 4.011, len  test loss 0.077, col  test loss 160.943


Epoch 39: 272batch [00:18, 14.49batch/s, loss=945]


epoch 39: avg train loss 923.30, bar train loss 3.941, len train loss 0.077, col train loss 160.380


Epoch 40: 2batch [00:00, 14.60batch/s, loss=928]

epoch 39: avg test  loss 925.51, bar  test loss 3.964, len  test loss 0.078, col  test loss 160.799


Epoch 40: 272batch [00:18, 14.49batch/s, loss=898]


epoch 40: avg train loss 922.22, bar train loss 3.912, len train loss 0.075, col train loss 160.260
epoch 40: avg test  loss 924.32, bar  test loss 3.917, len  test loss 0.072, col  test loss 160.718


Epoch 41: 272batch [00:18, 14.53batch/s, loss=939]


epoch 41: avg train loss 921.34, bar train loss 3.883, len train loss 0.076, col train loss 160.132


Epoch 42: 2batch [00:00, 13.79batch/s, loss=922]

epoch 41: avg test  loss 924.54, bar  test loss 3.937, len  test loss 0.078, col  test loss 160.628


Epoch 42: 272batch [00:19, 13.94batch/s, loss=889]


epoch 42: avg train loss 920.57, bar train loss 3.862, len train loss 0.075, col train loss 160.044


Epoch 43: 2batch [00:00, 14.49batch/s, loss=892]

epoch 42: avg test  loss 923.14, bar  test loss 3.851, len  test loss 0.075, col  test loss 160.534


Epoch 43: 272batch [00:18, 14.55batch/s, loss=985]


epoch 43: avg train loss 919.04, bar train loss 3.832, len train loss 0.075, col train loss 159.803


Epoch 44: 2batch [00:00, 14.29batch/s, loss=899]

epoch 43: avg test  loss 921.13, bar  test loss 3.846, len  test loss 0.073, col  test loss 160.250


Epoch 44: 272batch [00:18, 14.50batch/s, loss=1.08e+3]


epoch 44: avg train loss 917.34, bar train loss 3.805, len train loss 0.075, col train loss 159.540


Epoch 45: 2batch [00:00, 12.90batch/s, loss=913]

epoch 44: avg test  loss 921.48, bar  test loss 3.864, len  test loss 0.077, col  test loss 160.102


Epoch 45: 272batch [00:18, 14.35batch/s, loss=962]


epoch 45: avg train loss 916.35, bar train loss 3.785, len train loss 0.073, col train loss 159.396
epoch 45: avg test  loss 919.63, bar  test loss 3.817, len  test loss 0.074, col  test loss 160.016


Epoch 46: 272batch [00:18, 14.48batch/s, loss=913]


epoch 46: avg train loss 915.65, bar train loss 3.769, len train loss 0.073, col train loss 159.266


Epoch 47: 2batch [00:00, 14.39batch/s, loss=937]

epoch 46: avg test  loss 918.72, bar  test loss 3.812, len  test loss 0.076, col  test loss 159.809


Epoch 47: 272batch [00:18, 14.55batch/s, loss=992]


epoch 47: avg train loss 914.28, bar train loss 3.744, len train loss 0.073, col train loss 159.060


Epoch 48: 2batch [00:00, 14.49batch/s, loss=904]

epoch 47: avg test  loss 917.49, bar  test loss 3.754, len  test loss 0.076, col  test loss 159.743


Epoch 48: 272batch [00:18, 14.53batch/s, loss=975]


epoch 48: avg train loss 913.54, bar train loss 3.725, len train loss 0.074, col train loss 158.927


Epoch 49: 2batch [00:00, 14.60batch/s, loss=893]

epoch 48: avg test  loss 918.14, bar  test loss 3.769, len  test loss 0.077, col  test loss 159.594


Epoch 49: 272batch [00:19, 14.27batch/s, loss=988]


epoch 49: avg train loss 912.71, bar train loss 3.711, len train loss 0.072, col train loss 158.798


Epoch 50: 2batch [00:00, 14.60batch/s, loss=910]

epoch 49: avg test  loss 915.79, bar  test loss 3.728, len  test loss 0.069, col  test loss 159.432


Epoch 50: 272batch [00:18, 14.52batch/s, loss=902]


epoch 50: avg train loss 911.90, bar train loss 3.689, len train loss 0.071, col train loss 158.698
epoch 50: avg test  loss 915.50, bar  test loss 3.723, len  test loss 0.072, col  test loss 159.366


Epoch 51: 272batch [00:18, 14.50batch/s, loss=985]


epoch 51: avg train loss 911.19, bar train loss 3.672, len train loss 0.073, col train loss 158.564


Epoch 52: 2batch [00:00, 14.49batch/s, loss=888]

epoch 51: avg test  loss 914.55, bar  test loss 3.668, len  test loss 0.072, col  test loss 159.189


Epoch 52: 272batch [00:18, 14.48batch/s, loss=950]


epoch 52: avg train loss 910.28, bar train loss 3.653, len train loss 0.071, col train loss 158.460


Epoch 53: 2batch [00:00, 14.60batch/s, loss=883]

epoch 52: avg test  loss 913.71, bar  test loss 3.655, len  test loss 0.069, col  test loss 159.172


Epoch 53: 272batch [00:19, 14.31batch/s, loss=914]


epoch 53: avg train loss 909.24, bar train loss 3.637, len train loss 0.071, col train loss 158.298


Epoch 54: 2batch [00:00, 14.39batch/s, loss=923]

epoch 53: avg test  loss 913.09, bar  test loss 3.666, len  test loss 0.068, col  test loss 159.050


Epoch 54: 272batch [00:18, 14.50batch/s, loss=951]


epoch 54: avg train loss 908.59, bar train loss 3.627, len train loss 0.069, col train loss 158.206


Epoch 55: 2batch [00:00, 14.71batch/s, loss=885]

epoch 54: avg test  loss 912.31, bar  test loss 3.619, len  test loss 0.070, col  test loss 158.913


Epoch 55: 272batch [00:19, 14.23batch/s, loss=917]


epoch 55: avg train loss 907.82, bar train loss 3.600, len train loss 0.070, col train loss 158.080
epoch 55: avg test  loss 913.22, bar  test loss 3.684, len  test loss 0.077, col  test loss 158.916


Epoch 56: 272batch [00:19, 14.10batch/s, loss=905]


epoch 56: avg train loss 907.13, bar train loss 3.590, len train loss 0.069, col train loss 157.971


Epoch 57: 2batch [00:00, 14.60batch/s, loss=921]

epoch 56: avg test  loss 911.52, bar  test loss 3.650, len  test loss 0.074, col  test loss 158.747


Epoch 57: 272batch [00:18, 14.46batch/s, loss=978]


epoch 57: avg train loss 906.57, bar train loss 3.581, len train loss 0.070, col train loss 157.847


Epoch 58: 2batch [00:00, 14.71batch/s, loss=949]

epoch 57: avg test  loss 911.53, bar  test loss 3.617, len  test loss 0.077, col  test loss 158.546


Epoch 58: 272batch [00:18, 14.40batch/s, loss=917]


epoch 58: avg train loss 905.55, bar train loss 3.559, len train loss 0.069, col train loss 157.700


Epoch 59: 2batch [00:00, 14.18batch/s, loss=878]

epoch 58: avg test  loss 909.89, bar  test loss 3.587, len  test loss 0.067, col  test loss 158.543


Epoch 59: 272batch [00:18, 14.55batch/s, loss=829]


epoch 59: avg train loss 904.63, bar train loss 3.542, len train loss 0.067, col train loss 157.600


Epoch 60: 2batch [00:00, 14.39batch/s, loss=905]

epoch 59: avg test  loss 909.49, bar  test loss 3.571, len  test loss 0.068, col  test loss 158.450


Epoch 60: 272batch [00:18, 14.54batch/s, loss=839]


epoch 60: avg train loss 904.22, bar train loss 3.537, len train loss 0.066, col train loss 157.515
epoch 60: avg test  loss 909.27, bar  test loss 3.585, len  test loss 0.070, col  test loss 158.376


Epoch 61: 272batch [00:19, 14.12batch/s, loss=935]


epoch 61: avg train loss 903.52, bar train loss 3.522, len train loss 0.067, col train loss 157.410


Epoch 62: 2batch [00:00, 14.71batch/s, loss=929]

epoch 61: avg test  loss 908.97, bar  test loss 3.564, len  test loss 0.072, col  test loss 158.317


Epoch 62: 272batch [00:18, 14.53batch/s, loss=905]


epoch 62: avg train loss 902.52, bar train loss 3.506, len train loss 0.063, col train loss 157.322


Epoch 63: 2batch [00:00, 14.60batch/s, loss=910]

epoch 62: avg test  loss 907.37, bar  test loss 3.538, len  test loss 0.065, col  test loss 158.216


Epoch 63: 272batch [00:18, 14.56batch/s, loss=838]


epoch 63: avg train loss 901.69, bar train loss 3.499, len train loss 0.062, col train loss 157.193


Epoch 64: 2batch [00:00, 14.93batch/s, loss=903]

epoch 63: avg test  loss 906.91, bar  test loss 3.527, len  test loss 0.063, col  test loss 158.152


Epoch 64: 272batch [00:18, 14.35batch/s, loss=869]


epoch 64: avg train loss 900.60, bar train loss 3.485, len train loss 0.058, col train loss 157.102


Epoch 65: 2batch [00:00, 14.39batch/s, loss=922]

epoch 64: avg test  loss 905.54, bar  test loss 3.529, len  test loss 0.057, col  test loss 158.063


Epoch 65: 272batch [00:18, 14.36batch/s, loss=953]


epoch 65: avg train loss 899.63, bar train loss 3.472, len train loss 0.056, col train loss 156.962
epoch 65: avg test  loss 904.71, bar  test loss 3.513, len  test loss 0.054, col  test loss 157.967


Epoch 66: 272batch [00:18, 14.42batch/s, loss=846]


epoch 66: avg train loss 898.45, bar train loss 3.464, len train loss 0.052, col train loss 156.861


Epoch 67: 2batch [00:00, 14.39batch/s, loss=881]

epoch 66: avg test  loss 904.76, bar  test loss 3.504, len  test loss 0.055, col  test loss 157.932


Epoch 67: 272batch [00:18, 14.47batch/s, loss=873]


epoch 67: avg train loss 897.78, bar train loss 3.450, len train loss 0.051, col train loss 156.786


Epoch 68: 2batch [00:00, 14.71batch/s, loss=906]

epoch 67: avg test  loss 903.49, bar  test loss 3.537, len  test loss 0.052, col  test loss 157.800


Epoch 68: 272batch [00:19, 14.28batch/s, loss=871]


epoch 68: avg train loss 896.59, bar train loss 3.448, len train loss 0.048, col train loss 156.601


Epoch 69: 2batch [00:00, 14.39batch/s, loss=889]

epoch 68: avg test  loss 901.95, bar  test loss 3.497, len  test loss 0.046, col  test loss 157.598


Epoch 69: 272batch [00:18, 14.46batch/s, loss=945]


epoch 69: avg train loss 895.29, bar train loss 3.438, len train loss 0.046, col train loss 156.425


Epoch 70: 2batch [00:00, 14.39batch/s, loss=894]

epoch 69: avg test  loss 901.99, bar  test loss 3.490, len  test loss 0.053, col  test loss 157.503


Epoch 70: 272batch [00:18, 14.48batch/s, loss=1e+3]


epoch 70: avg train loss 894.42, bar train loss 3.426, len train loss 0.044, col train loss 156.300
epoch 70: avg test  loss 900.55, bar  test loss 3.470, len  test loss 0.042, col  test loss 157.429


Epoch 71: 272batch [00:19, 14.10batch/s, loss=913]


epoch 71: avg train loss 893.44, bar train loss 3.420, len train loss 0.041, col train loss 156.199


Epoch 72: 2batch [00:00, 14.81batch/s, loss=880]

epoch 71: avg test  loss 899.82, bar  test loss 3.501, len  test loss 0.041, col  test loss 157.286


Epoch 72: 272batch [00:18, 14.48batch/s, loss=838]


epoch 72: avg train loss 892.65, bar train loss 3.404, len train loss 0.040, col train loss 156.086


Epoch 73: 2batch [00:00, 14.49batch/s, loss=888]

epoch 72: avg test  loss 899.07, bar  test loss 3.475, len  test loss 0.042, col  test loss 157.199


Epoch 73: 272batch [00:18, 14.42batch/s, loss=936]


epoch 73: avg train loss 891.50, bar train loss 3.394, len train loss 0.038, col train loss 155.937


Epoch 74: 2batch [00:00, 13.89batch/s, loss=874]

epoch 73: avg test  loss 897.81, bar  test loss 3.420, len  test loss 0.038, col  test loss 157.092


Epoch 74: 272batch [00:19, 14.30batch/s, loss=943]


epoch 74: avg train loss 890.63, bar train loss 3.386, len train loss 0.038, col train loss 155.778


Epoch 75: 2batch [00:00, 14.60batch/s, loss=871]

epoch 74: avg test  loss 896.80, bar  test loss 3.432, len  test loss 0.036, col  test loss 156.921


Epoch 75: 272batch [00:19, 14.31batch/s, loss=825]


epoch 75: avg train loss 890.00, bar train loss 3.382, len train loss 0.037, col train loss 155.661
epoch 75: avg test  loss 896.45, bar  test loss 3.413, len  test loss 0.035, col  test loss 156.821


Epoch 76: 272batch [00:19, 14.28batch/s, loss=865]


epoch 76: avg train loss 889.17, bar train loss 3.365, len train loss 0.035, col train loss 155.575


Epoch 77: 2batch [00:00, 14.18batch/s, loss=882]

epoch 76: avg test  loss 895.98, bar  test loss 3.424, len  test loss 0.037, col  test loss 156.798


Epoch 77: 272batch [00:18, 14.41batch/s, loss=967]


epoch 77: avg train loss 888.61, bar train loss 3.360, len train loss 0.036, col train loss 155.466


Epoch 78: 2batch [00:00, 14.71batch/s, loss=879]

epoch 77: avg test  loss 895.31, bar  test loss 3.415, len  test loss 0.034, col  test loss 156.673


Epoch 78: 272batch [00:18, 14.43batch/s, loss=885]


epoch 78: avg train loss 887.83, bar train loss 3.347, len train loss 0.035, col train loss 155.329


Epoch 79: 2batch [00:00, 13.70batch/s, loss=870]

epoch 78: avg test  loss 894.62, bar  test loss 3.417, len  test loss 0.033, col  test loss 156.565


Epoch 79: 272batch [00:19, 14.08batch/s, loss=917]


epoch 79: avg train loss 887.10, bar train loss 3.335, len train loss 0.034, col train loss 155.212


Epoch 80: 2batch [00:00, 14.08batch/s, loss=933]

epoch 79: avg test  loss 894.33, bar  test loss 3.428, len  test loss 0.034, col  test loss 156.489


Epoch 80: 272batch [00:18, 14.43batch/s, loss=863]


epoch 80: avg train loss 886.21, bar train loss 3.326, len train loss 0.033, col train loss 155.074
epoch 80: avg test  loss 894.21, bar  test loss 3.389, len  test loss 0.039, col  test loss 156.386


Epoch 81: 272batch [00:19, 14.18batch/s, loss=855]


epoch 81: avg train loss 885.45, bar train loss 3.320, len train loss 0.033, col train loss 154.918


Epoch 82: 2batch [00:00, 14.49batch/s, loss=849]

epoch 81: avg test  loss 893.14, bar  test loss 3.355, len  test loss 0.032, col  test loss 156.275


Epoch 82: 272batch [00:19, 14.29batch/s, loss=888]


epoch 82: avg train loss 884.64, bar train loss 3.302, len train loss 0.033, col train loss 154.812


Epoch 83: 2batch [00:00, 14.29batch/s, loss=891]

epoch 82: avg test  loss 892.48, bar  test loss 3.336, len  test loss 0.032, col  test loss 156.195


Epoch 83: 272batch [00:19, 14.24batch/s, loss=892]


epoch 83: avg train loss 884.09, bar train loss 3.296, len train loss 0.032, col train loss 154.721


Epoch 84: 2batch [00:00, 13.89batch/s, loss=844]

epoch 83: avg test  loss 892.23, bar  test loss 3.364, len  test loss 0.031, col  test loss 156.084


Epoch 84: 272batch [00:19, 14.19batch/s, loss=937]


epoch 84: avg train loss 883.74, bar train loss 3.289, len train loss 0.031, col train loss 154.650


Epoch 85: 2batch [00:00, 13.89batch/s, loss=875]

epoch 84: avg test  loss 891.57, bar  test loss 3.323, len  test loss 0.034, col  test loss 156.023


Epoch 85: 272batch [00:19, 14.12batch/s, loss=811]


epoch 85: avg train loss 882.87, bar train loss 3.276, len train loss 0.032, col train loss 154.496
epoch 85: avg test  loss 891.27, bar  test loss 3.352, len  test loss 0.031, col  test loss 155.968


Epoch 86: 272batch [00:18, 14.35batch/s, loss=845]


epoch 86: avg train loss 882.24, bar train loss 3.265, len train loss 0.032, col train loss 154.387


Epoch 87: 2batch [00:00, 14.71batch/s, loss=880]

epoch 86: avg test  loss 890.45, bar  test loss 3.335, len  test loss 0.031, col  test loss 155.832


Epoch 87: 272batch [00:18, 14.35batch/s, loss=795]


epoch 87: avg train loss 881.82, bar train loss 3.260, len train loss 0.031, col train loss 154.296


Epoch 88: 2batch [00:00, 14.08batch/s, loss=908]

epoch 87: avg test  loss 890.98, bar  test loss 3.300, len  test loss 0.038, col  test loss 155.800


Epoch 88: 272batch [00:18, 14.33batch/s, loss=824]


epoch 88: avg train loss 881.34, bar train loss 3.249, len train loss 0.031, col train loss 154.216


Epoch 89: 2batch [00:00, 14.39batch/s, loss=899]

epoch 88: avg test  loss 890.19, bar  test loss 3.300, len  test loss 0.033, col  test loss 155.809


Epoch 89: 272batch [00:18, 14.38batch/s, loss=904]


epoch 89: avg train loss 880.78, bar train loss 3.239, len train loss 0.031, col train loss 154.131


Epoch 90: 2batch [00:00, 14.49batch/s, loss=871]

epoch 89: avg test  loss 889.76, bar  test loss 3.296, len  test loss 0.031, col  test loss 155.684


Epoch 90: 272batch [00:18, 14.38batch/s, loss=955]


epoch 90: avg train loss 879.80, bar train loss 3.222, len train loss 0.030, col train loss 153.971
epoch 90: avg test  loss 888.72, bar  test loss 3.305, len  test loss 0.033, col  test loss 155.415


Epoch 91: 272batch [00:19, 13.90batch/s, loss=906]


epoch 91: avg train loss 878.99, bar train loss 3.213, len train loss 0.030, col train loss 153.834


Epoch 92: 2batch [00:00, 14.39batch/s, loss=869]

epoch 91: avg test  loss 887.81, bar  test loss 3.298, len  test loss 0.030, col  test loss 155.337


Epoch 92: 272batch [00:18, 14.35batch/s, loss=859]


epoch 92: avg train loss 878.47, bar train loss 3.203, len train loss 0.030, col train loss 153.722


Epoch 93: 2batch [00:00, 14.39batch/s, loss=929]

epoch 92: avg test  loss 887.48, bar  test loss 3.258, len  test loss 0.030, col  test loss 155.373


Epoch 93: 272batch [00:18, 14.36batch/s, loss=893]


epoch 93: avg train loss 877.81, bar train loss 3.186, len train loss 0.030, col train loss 153.640


Epoch 94: 2batch [00:00, 13.99batch/s, loss=875]

epoch 93: avg test  loss 887.34, bar  test loss 3.279, len  test loss 0.031, col  test loss 155.323


Epoch 94: 272batch [00:19, 14.02batch/s, loss=860]


epoch 94: avg train loss 877.29, bar train loss 3.176, len train loss 0.031, col train loss 153.537


Epoch 95: 2batch [00:00, 14.71batch/s, loss=896]

epoch 94: avg test  loss 887.25, bar  test loss 3.254, len  test loss 0.030, col  test loss 155.270


Epoch 95: 272batch [00:18, 14.36batch/s, loss=919]


epoch 95: avg train loss 876.68, bar train loss 3.171, len train loss 0.029, col train loss 153.452
epoch 95: avg test  loss 886.92, bar  test loss 3.216, len  test loss 0.032, col  test loss 155.128


Epoch 96: 272batch [00:19, 14.27batch/s, loss=888]


epoch 96: avg train loss 876.26, bar train loss 3.159, len train loss 0.029, col train loss 153.368


Epoch 97: 2batch [00:00, 14.49batch/s, loss=886]

epoch 96: avg test  loss 886.04, bar  test loss 3.217, len  test loss 0.030, col  test loss 155.166


Epoch 97: 272batch [00:18, 14.44batch/s, loss=835]


epoch 97: avg train loss 875.70, bar train loss 3.143, len train loss 0.030, col train loss 153.289


Epoch 98: 2batch [00:00, 14.60batch/s, loss=899]

epoch 97: avg test  loss 885.63, bar  test loss 3.220, len  test loss 0.032, col  test loss 154.992


Epoch 98: 272batch [00:19, 14.20batch/s, loss=915]


epoch 98: avg train loss 874.87, bar train loss 3.136, len train loss 0.029, col train loss 153.141


Epoch 99: 2batch [00:00, 13.79batch/s, loss=893]

epoch 98: avg test  loss 884.90, bar  test loss 3.208, len  test loss 0.029, col  test loss 154.939


Epoch 99: 272batch [00:19, 13.92batch/s, loss=890]


epoch 99: avg train loss 874.27, bar train loss 3.125, len train loss 0.029, col train loss 153.046


Epoch 100: 2batch [00:00, 13.89batch/s, loss=858]

epoch 99: avg test  loss 884.70, bar  test loss 3.207, len  test loss 0.033, col  test loss 154.901


Epoch 100: 272batch [00:19, 14.17batch/s, loss=837]


epoch 100: avg train loss 873.59, bar train loss 3.111, len train loss 0.028, col train loss 152.946
epoch 100: avg test  loss 883.94, bar  test loss 3.200, len  test loss 0.030, col  test loss 154.767


Epoch 101: 272batch [00:19, 14.08batch/s, loss=882]


epoch 101: avg train loss 872.92, bar train loss 3.098, len train loss 0.029, col train loss 152.853


Epoch 102: 2batch [00:00, 14.29batch/s, loss=898]

epoch 101: avg test  loss 884.08, bar  test loss 3.156, len  test loss 0.029, col  test loss 154.770


Epoch 102: 272batch [00:19, 14.09batch/s, loss=978]


epoch 102: avg train loss 872.40, bar train loss 3.086, len train loss 0.029, col train loss 152.780


Epoch 103: 2batch [00:00, 13.79batch/s, loss=881]

epoch 102: avg test  loss 883.39, bar  test loss 3.164, len  test loss 0.030, col  test loss 154.707


Epoch 103: 272batch [00:19, 14.21batch/s, loss=946]


epoch 103: avg train loss 872.09, bar train loss 3.082, len train loss 0.029, col train loss 152.689


Epoch 104: 2batch [00:00, 14.08batch/s, loss=868]

epoch 103: avg test  loss 882.34, bar  test loss 3.145, len  test loss 0.029, col  test loss 154.548


Epoch 104: 272batch [00:19, 13.99batch/s, loss=806]


epoch 104: avg train loss 870.94, bar train loss 3.063, len train loss 0.028, col train loss 152.540


Epoch 105: 2batch [00:00, 14.08batch/s, loss=915]

epoch 104: avg test  loss 881.96, bar  test loss 3.130, len  test loss 0.028, col  test loss 154.436


Epoch 105: 272batch [00:18, 14.33batch/s, loss=915]


epoch 105: avg train loss 870.39, bar train loss 3.051, len train loss 0.029, col train loss 152.446
epoch 105: avg test  loss 881.36, bar  test loss 3.130, len  test loss 0.028, col  test loss 154.418


Epoch 106: 272batch [00:19, 14.27batch/s, loss=880]


epoch 106: avg train loss 869.76, bar train loss 3.038, len train loss 0.028, col train loss 152.355


Epoch 107: 2batch [00:00, 14.29batch/s, loss=866]

epoch 106: avg test  loss 881.18, bar  test loss 3.119, len  test loss 0.029, col  test loss 154.334


Epoch 107: 272batch [00:18, 14.32batch/s, loss=910]


epoch 107: avg train loss 869.19, bar train loss 3.029, len train loss 0.028, col train loss 152.288


Epoch 108: 2batch [00:00, 14.29batch/s, loss=894]

epoch 107: avg test  loss 881.24, bar  test loss 3.128, len  test loss 0.034, col  test loss 154.350


Epoch 108: 272batch [00:18, 14.37batch/s, loss=869]


epoch 108: avg train loss 868.65, bar train loss 3.014, len train loss 0.029, col train loss 152.182


Epoch 109: 2batch [00:00, 14.39batch/s, loss=861]

epoch 108: avg test  loss 879.83, bar  test loss 3.093, len  test loss 0.028, col  test loss 154.247


Epoch 109: 272batch [00:19, 14.27batch/s, loss=834]


epoch 109: avg train loss 867.93, bar train loss 3.004, len train loss 0.028, col train loss 152.092


Epoch 110: 2batch [00:00, 14.08batch/s, loss=860]

epoch 109: avg test  loss 879.98, bar  test loss 3.094, len  test loss 0.028, col  test loss 154.187


Epoch 110: 272batch [00:19, 14.31batch/s, loss=903]


epoch 110: avg train loss 867.66, bar train loss 2.997, len train loss 0.028, col train loss 152.030
epoch 110: avg test  loss 879.64, bar  test loss 3.074, len  test loss 0.031, col  test loss 154.127


Epoch 111: 272batch [00:19, 14.12batch/s, loss=833]


epoch 111: avg train loss 866.99, bar train loss 2.985, len train loss 0.028, col train loss 151.933


Epoch 112: 2batch [00:00, 13.51batch/s, loss=861]

epoch 111: avg test  loss 879.46, bar  test loss 3.084, len  test loss 0.033, col  test loss 154.008


Epoch 112: 272batch [00:19, 14.13batch/s, loss=859]


epoch 112: avg train loss 866.39, bar train loss 2.973, len train loss 0.028, col train loss 151.836


Epoch 113: 2batch [00:00, 14.39batch/s, loss=851]

epoch 112: avg test  loss 878.27, bar  test loss 3.060, len  test loss 0.028, col  test loss 153.994


Epoch 113: 272batch [00:19, 14.07batch/s, loss=857]


epoch 113: avg train loss 865.76, bar train loss 2.962, len train loss 0.029, col train loss 151.704


Epoch 114: 2batch [00:00, 14.49batch/s, loss=873]

epoch 113: avg test  loss 878.43, bar  test loss 3.046, len  test loss 0.030, col  test loss 153.851


Epoch 114: 272batch [00:18, 14.33batch/s, loss=921]


epoch 114: avg train loss 865.19, bar train loss 2.952, len train loss 0.028, col train loss 151.607


Epoch 115: 2batch [00:00, 14.18batch/s, loss=881]

epoch 114: avg test  loss 877.75, bar  test loss 3.055, len  test loss 0.029, col  test loss 153.957


Epoch 115: 272batch [00:19, 14.30batch/s, loss=827]


epoch 115: avg train loss 864.43, bar train loss 2.935, len train loss 0.028, col train loss 151.528
epoch 115: avg test  loss 877.87, bar  test loss 3.037, len  test loss 0.029, col  test loss 153.801


Epoch 116: 272batch [00:19, 14.20batch/s, loss=855]


epoch 116: avg train loss 864.13, bar train loss 2.933, len train loss 0.028, col train loss 151.450


Epoch 117: 2batch [00:00, 14.18batch/s, loss=839]

epoch 116: avg test  loss 876.84, bar  test loss 3.012, len  test loss 0.028, col  test loss 153.778


Epoch 117: 272batch [00:19, 14.31batch/s, loss=942]


epoch 117: avg train loss 863.42, bar train loss 2.918, len train loss 0.028, col train loss 151.347


Epoch 118: 2batch [00:00, 13.89batch/s, loss=850]

epoch 117: avg test  loss 876.58, bar  test loss 3.027, len  test loss 0.028, col  test loss 153.783


Epoch 118: 272batch [00:19, 14.31batch/s, loss=989]


epoch 118: avg train loss 862.91, bar train loss 2.913, len train loss 0.027, col train loss 151.267


Epoch 119: 2batch [00:00, 14.39batch/s, loss=861]

epoch 118: avg test  loss 876.82, bar  test loss 3.002, len  test loss 0.031, col  test loss 153.645


Epoch 119: 272batch [00:19, 14.27batch/s, loss=849]


epoch 119: avg train loss 862.50, bar train loss 2.902, len train loss 0.028, col train loss 151.173


Epoch 120: 2batch [00:00, 13.79batch/s, loss=830]

epoch 119: avg test  loss 875.79, bar  test loss 2.986, len  test loss 0.027, col  test loss 153.508


Epoch 120: 272batch [00:19, 14.31batch/s, loss=877]


epoch 120: avg train loss 862.16, bar train loss 2.892, len train loss 0.028, col train loss 151.128
epoch 120: avg test  loss 875.66, bar  test loss 2.971, len  test loss 0.029, col  test loss 153.531


Epoch 121: 272batch [00:19, 14.21batch/s, loss=870]


epoch 121: avg train loss 861.48, bar train loss 2.879, len train loss 0.028, col train loss 151.036


Epoch 122: 2batch [00:00, 14.18batch/s, loss=850]

epoch 121: avg test  loss 875.10, bar  test loss 2.969, len  test loss 0.029, col  test loss 153.460


Epoch 122: 272batch [00:19, 13.96batch/s, loss=900]


epoch 122: avg train loss 860.73, bar train loss 2.866, len train loss 0.027, col train loss 150.939


Epoch 123: 2batch [00:00, 14.49batch/s, loss=834]

epoch 122: avg test  loss 874.94, bar  test loss 2.983, len  test loss 0.028, col  test loss 153.378


Epoch 123: 272batch [00:19, 13.76batch/s, loss=812]


epoch 123: avg train loss 860.38, bar train loss 2.860, len train loss 0.028, col train loss 150.866


Epoch 124: 2batch [00:00, 13.99batch/s, loss=844]

epoch 123: avg test  loss 875.57, bar  test loss 2.975, len  test loss 0.037, col  test loss 153.386


Epoch 124: 272batch [00:19, 14.25batch/s, loss=873]


epoch 124: avg train loss 859.97, bar train loss 2.854, len train loss 0.028, col train loss 150.764


Epoch 125: 2batch [00:00, 14.60batch/s, loss=893]

epoch 124: avg test  loss 874.61, bar  test loss 2.954, len  test loss 0.032, col  test loss 153.282


Epoch 125: 272batch [00:18, 14.73batch/s, loss=929]


epoch 125: avg train loss 859.35, bar train loss 2.841, len train loss 0.028, col train loss 150.692
epoch 125: avg test  loss 874.08, bar  test loss 2.948, len  test loss 0.030, col  test loss 153.307


Epoch 126: 272batch [00:18, 14.63batch/s, loss=923]


epoch 126: avg train loss 858.75, bar train loss 2.833, len train loss 0.028, col train loss 150.584


Epoch 127: 2batch [00:00, 14.18batch/s, loss=864]

epoch 126: avg test  loss 873.84, bar  test loss 2.971, len  test loss 0.028, col  test loss 153.238


Epoch 127: 272batch [00:18, 14.39batch/s, loss=905]


epoch 127: avg train loss 858.20, bar train loss 2.820, len train loss 0.028, col train loss 150.509


Epoch 128: 2batch [00:00, 13.79batch/s, loss=871]

epoch 127: avg test  loss 873.24, bar  test loss 2.928, len  test loss 0.029, col  test loss 153.127


Epoch 128: 272batch [00:18, 14.53batch/s, loss=826]


epoch 128: avg train loss 857.92, bar train loss 2.816, len train loss 0.027, col train loss 150.469


Epoch 129: 2batch [00:00, 14.60batch/s, loss=876]

epoch 128: avg test  loss 872.88, bar  test loss 2.909, len  test loss 0.028, col  test loss 153.097


Epoch 129: 272batch [00:18, 14.72batch/s, loss=857]


epoch 129: avg train loss 857.44, bar train loss 2.810, len train loss 0.028, col train loss 150.357


Epoch 130: 2batch [00:00, 14.60batch/s, loss=867]

epoch 129: avg test  loss 872.64, bar  test loss 2.934, len  test loss 0.028, col  test loss 153.053


Epoch 130: 272batch [00:18, 14.72batch/s, loss=834]


epoch 130: avg train loss 856.89, bar train loss 2.798, len train loss 0.027, col train loss 150.275
epoch 130: avg test  loss 872.23, bar  test loss 2.895, len  test loss 0.027, col  test loss 153.051


Epoch 131: 272batch [00:18, 14.63batch/s, loss=832]


epoch 131: avg train loss 856.58, bar train loss 2.796, len train loss 0.028, col train loss 150.192


Epoch 132: 2batch [00:00, 14.29batch/s, loss=835]

epoch 131: avg test  loss 872.18, bar  test loss 2.871, len  test loss 0.030, col  test loss 152.928


Epoch 132: 272batch [00:18, 14.62batch/s, loss=819]


epoch 132: avg train loss 856.06, bar train loss 2.786, len train loss 0.027, col train loss 150.120


Epoch 133: 2batch [00:00, 14.60batch/s, loss=873]

epoch 132: avg test  loss 872.00, bar  test loss 2.884, len  test loss 0.028, col  test loss 152.908


Epoch 133: 272batch [00:18, 14.71batch/s, loss=891]


epoch 133: avg train loss 855.47, bar train loss 2.774, len train loss 0.027, col train loss 150.030


Epoch 134: 2batch [00:00, 14.60batch/s, loss=845]

epoch 133: avg test  loss 871.13, bar  test loss 2.886, len  test loss 0.028, col  test loss 152.748


Epoch 134: 272batch [00:18, 14.70batch/s, loss=809]


epoch 134: avg train loss 854.99, bar train loss 2.769, len train loss 0.028, col train loss 149.886


Epoch 135: 2batch [00:00, 14.81batch/s, loss=850]

epoch 134: avg test  loss 871.12, bar  test loss 2.882, len  test loss 0.030, col  test loss 152.706


Epoch 135: 272batch [00:18, 14.64batch/s, loss=843]


epoch 135: avg train loss 854.29, bar train loss 2.757, len train loss 0.028, col train loss 149.805
epoch 135: avg test  loss 870.99, bar  test loss 2.895, len  test loss 0.032, col  test loss 152.789


Epoch 136: 272batch [00:18, 14.68batch/s, loss=925]


epoch 136: avg train loss 853.61, bar train loss 2.749, len train loss 0.027, col train loss 149.687


Epoch 137: 2batch [00:00, 14.49batch/s, loss=838]

epoch 136: avg test  loss 870.01, bar  test loss 2.847, len  test loss 0.028, col  test loss 152.601


Epoch 137: 272batch [00:18, 14.76batch/s, loss=891]


epoch 137: avg train loss 853.03, bar train loss 2.740, len train loss 0.027, col train loss 149.579


Epoch 138: 2batch [00:00, 14.81batch/s, loss=855]

epoch 137: avg test  loss 869.51, bar  test loss 2.856, len  test loss 0.028, col  test loss 152.325


Epoch 138: 272batch [00:18, 14.68batch/s, loss=941]


epoch 138: avg train loss 852.51, bar train loss 2.736, len train loss 0.027, col train loss 149.442


Epoch 139: 2batch [00:00, 14.49batch/s, loss=861]

epoch 138: avg test  loss 869.17, bar  test loss 2.858, len  test loss 0.030, col  test loss 152.369


Epoch 139: 272batch [00:18, 14.73batch/s, loss=835]


epoch 139: avg train loss 851.98, bar train loss 2.727, len train loss 0.027, col train loss 149.348


Epoch 140: 2batch [00:00, 14.49batch/s, loss=867]

epoch 139: avg test  loss 868.66, bar  test loss 2.862, len  test loss 0.027, col  test loss 152.226


Epoch 140: 272batch [00:18, 14.69batch/s, loss=869]


epoch 140: avg train loss 851.42, bar train loss 2.722, len train loss 0.028, col train loss 149.239
epoch 140: avg test  loss 868.69, bar  test loss 2.855, len  test loss 0.027, col  test loss 152.345


Epoch 141: 272batch [00:18, 14.59batch/s, loss=871]


epoch 141: avg train loss 851.18, bar train loss 2.715, len train loss 0.027, col train loss 149.202


Epoch 142: 2batch [00:00, 14.71batch/s, loss=907]

epoch 141: avg test  loss 868.27, bar  test loss 2.818, len  test loss 0.027, col  test loss 152.112


Epoch 142: 272batch [00:18, 14.70batch/s, loss=825]


epoch 142: avg train loss 850.81, bar train loss 2.710, len train loss 0.027, col train loss 149.127


Epoch 143: 2batch [00:00, 14.71batch/s, loss=843]

epoch 142: avg test  loss 867.68, bar  test loss 2.851, len  test loss 0.029, col  test loss 152.175


Epoch 143: 272batch [00:18, 14.71batch/s, loss=906]


epoch 143: avg train loss 850.49, bar train loss 2.705, len train loss 0.027, col train loss 149.047


Epoch 144: 2batch [00:00, 14.60batch/s, loss=837]

epoch 143: avg test  loss 867.75, bar  test loss 2.822, len  test loss 0.027, col  test loss 152.065


Epoch 144: 272batch [00:18, 14.72batch/s, loss=895]


epoch 144: avg train loss 849.99, bar train loss 2.698, len train loss 0.027, col train loss 148.969


Epoch 145: 2batch [00:00, 14.93batch/s, loss=855]

epoch 144: avg test  loss 867.63, bar  test loss 2.815, len  test loss 0.028, col  test loss 152.021


Epoch 145: 272batch [00:18, 14.71batch/s, loss=882]


epoch 145: avg train loss 849.66, bar train loss 2.690, len train loss 0.028, col train loss 148.883
epoch 145: avg test  loss 867.19, bar  test loss 2.831, len  test loss 0.028, col  test loss 152.010


Epoch 146: 272batch [00:18, 14.57batch/s, loss=826]


epoch 146: avg train loss 849.14, bar train loss 2.680, len train loss 0.027, col train loss 148.800


Epoch 147: 2batch [00:00, 14.71batch/s, loss=853]

epoch 146: avg test  loss 867.07, bar  test loss 2.802, len  test loss 0.029, col  test loss 151.992


Epoch 147: 272batch [00:18, 14.71batch/s, loss=843]


epoch 147: avg train loss 848.85, bar train loss 2.678, len train loss 0.027, col train loss 148.730


Epoch 148: 2batch [00:00, 14.81batch/s, loss=838]

epoch 147: avg test  loss 867.04, bar  test loss 2.821, len  test loss 0.028, col  test loss 151.899


Epoch 148: 272batch [00:18, 14.72batch/s, loss=878]


epoch 148: avg train loss 848.26, bar train loss 2.669, len train loss 0.027, col train loss 148.642


Epoch 149: 2batch [00:00, 14.18batch/s, loss=865]

epoch 148: avg test  loss 866.89, bar  test loss 2.774, len  test loss 0.029, col  test loss 151.808


Epoch 149: 272batch [00:18, 14.70batch/s, loss=867]


epoch 149: avg train loss 847.63, bar train loss 2.666, len train loss 0.027, col train loss 148.497


Epoch 150: 2batch [00:00, 14.81batch/s, loss=802]

epoch 149: avg test  loss 865.56, bar  test loss 2.802, len  test loss 0.028, col  test loss 151.716


Epoch 150: 272batch [00:18, 14.70batch/s, loss=876]


epoch 150: avg train loss 847.38, bar train loss 2.660, len train loss 0.027, col train loss 148.427
epoch 150: avg test  loss 866.14, bar  test loss 2.795, len  test loss 0.029, col  test loss 151.697


Epoch 151: 272batch [00:18, 14.58batch/s, loss=894]


epoch 151: avg train loss 846.90, bar train loss 2.651, len train loss 0.027, col train loss 148.340


Epoch 152: 2batch [00:00, 14.60batch/s, loss=862]

epoch 151: avg test  loss 865.82, bar  test loss 2.756, len  test loss 0.029, col  test loss 151.625


Epoch 152: 272batch [00:18, 14.40batch/s, loss=813]


epoch 152: avg train loss 846.41, bar train loss 2.644, len train loss 0.027, col train loss 148.266


Epoch 153: 2batch [00:00, 14.49batch/s, loss=854]

epoch 152: avg test  loss 865.33, bar  test loss 2.747, len  test loss 0.027, col  test loss 151.475


Epoch 153: 272batch [00:18, 14.56batch/s, loss=802]


epoch 153: avg train loss 846.02, bar train loss 2.637, len train loss 0.027, col train loss 148.180


Epoch 154: 2batch [00:00, 14.50batch/s, loss=843]

epoch 153: avg test  loss 865.13, bar  test loss 2.753, len  test loss 0.028, col  test loss 151.527


Epoch 154: 272batch [00:18, 14.72batch/s, loss=814]


epoch 154: avg train loss 845.68, bar train loss 2.632, len train loss 0.027, col train loss 148.098


Epoch 155: 2batch [00:00, 14.93batch/s, loss=823]

epoch 154: avg test  loss 864.71, bar  test loss 2.765, len  test loss 0.028, col  test loss 151.414


Epoch 155: 272batch [00:19, 14.06batch/s, loss=872]


epoch 155: avg train loss 845.39, bar train loss 2.627, len train loss 0.027, col train loss 148.043
epoch 155: avg test  loss 864.83, bar  test loss 2.777, len  test loss 0.029, col  test loss 151.461


Epoch 156: 272batch [00:18, 14.33batch/s, loss=787]


epoch 156: avg train loss 844.66, bar train loss 2.617, len train loss 0.027, col train loss 147.945


Epoch 157: 2batch [00:00, 14.71batch/s, loss=848]

epoch 156: avg test  loss 864.40, bar  test loss 2.764, len  test loss 0.030, col  test loss 151.454


Epoch 157: 272batch [00:18, 14.62batch/s, loss=876]


epoch 157: avg train loss 844.50, bar train loss 2.619, len train loss 0.027, col train loss 147.889


Epoch 158: 2batch [00:00, 13.70batch/s, loss=820]

epoch 157: avg test  loss 863.98, bar  test loss 2.740, len  test loss 0.028, col  test loss 151.330


Epoch 158: 272batch [00:18, 14.43batch/s, loss=868]


epoch 158: avg train loss 844.05, bar train loss 2.609, len train loss 0.027, col train loss 147.789


Epoch 159: 2batch [00:00, 14.71batch/s, loss=852]

epoch 158: avg test  loss 863.71, bar  test loss 2.740, len  test loss 0.028, col  test loss 151.201


Epoch 159: 272batch [00:18, 14.66batch/s, loss=885]


epoch 159: avg train loss 843.60, bar train loss 2.600, len train loss 0.027, col train loss 147.720


Epoch 160: 2batch [00:00, 14.71batch/s, loss=864]

epoch 159: avg test  loss 863.70, bar  test loss 2.738, len  test loss 0.028, col  test loss 151.244


Epoch 160: 272batch [00:18, 14.66batch/s, loss=865]


epoch 160: avg train loss 843.31, bar train loss 2.594, len train loss 0.027, col train loss 147.660
epoch 160: avg test  loss 863.31, bar  test loss 2.763, len  test loss 0.028, col  test loss 151.193


Epoch 161: 272batch [00:18, 14.59batch/s, loss=845]


epoch 161: avg train loss 842.77, bar train loss 2.592, len train loss 0.026, col train loss 147.567


Epoch 162: 2batch [00:00, 14.71batch/s, loss=822]

epoch 161: avg test  loss 863.27, bar  test loss 2.711, len  test loss 0.030, col  test loss 151.117


Epoch 162: 272batch [00:18, 14.68batch/s, loss=790]


epoch 162: avg train loss 842.63, bar train loss 2.584, len train loss 0.026, col train loss 147.527


Epoch 163: 2batch [00:00, 14.71batch/s, loss=857]

epoch 162: avg test  loss 863.49, bar  test loss 2.767, len  test loss 0.032, col  test loss 151.119


Epoch 163: 272batch [00:18, 14.73batch/s, loss=812]


epoch 163: avg train loss 842.01, bar train loss 2.576, len train loss 0.027, col train loss 147.407


Epoch 164: 2batch [00:00, 14.18batch/s, loss=846]

epoch 163: avg test  loss 862.69, bar  test loss 2.751, len  test loss 0.028, col  test loss 151.115


Epoch 164: 272batch [00:18, 14.68batch/s, loss=792]


epoch 164: avg train loss 841.55, bar train loss 2.569, len train loss 0.027, col train loss 147.345


Epoch 165: 2batch [00:00, 14.81batch/s, loss=833]

epoch 164: avg test  loss 862.51, bar  test loss 2.689, len  test loss 0.027, col  test loss 150.940


Epoch 165: 272batch [00:18, 14.66batch/s, loss=822]


epoch 165: avg train loss 841.11, bar train loss 2.560, len train loss 0.026, col train loss 147.256
epoch 165: avg test  loss 862.36, bar  test loss 2.721, len  test loss 0.029, col  test loss 150.952


Epoch 166: 272batch [00:18, 14.59batch/s, loss=858]


epoch 166: avg train loss 840.41, bar train loss 2.555, len train loss 0.026, col train loss 147.140


Epoch 167: 2batch [00:00, 14.60batch/s, loss=805]

epoch 166: avg test  loss 861.23, bar  test loss 2.706, len  test loss 0.029, col  test loss 150.819


Epoch 167: 272batch [00:18, 14.63batch/s, loss=840]


epoch 167: avg train loss 839.86, bar train loss 2.546, len train loss 0.026, col train loss 147.015


Epoch 168: 2batch [00:00, 14.60batch/s, loss=840]

epoch 167: avg test  loss 861.29, bar  test loss 2.710, len  test loss 0.028, col  test loss 150.742


Epoch 168: 272batch [00:18, 14.66batch/s, loss=878]


epoch 168: avg train loss 839.40, bar train loss 2.543, len train loss 0.026, col train loss 146.925


Epoch 169: 2batch [00:00, 14.39batch/s, loss=847]

epoch 168: avg test  loss 861.15, bar  test loss 2.681, len  test loss 0.028, col  test loss 150.744


Epoch 169: 272batch [00:18, 14.72batch/s, loss=853]


epoch 169: avg train loss 839.01, bar train loss 2.531, len train loss 0.026, col train loss 146.873


Epoch 170: 2batch [00:00, 14.60batch/s, loss=818]

epoch 169: avg test  loss 860.42, bar  test loss 2.685, len  test loss 0.028, col  test loss 150.672


Epoch 170: 272batch [00:18, 14.62batch/s, loss=890]


epoch 170: avg train loss 838.44, bar train loss 2.523, len train loss 0.026, col train loss 146.778
epoch 170: avg test  loss 860.46, bar  test loss 2.689, len  test loss 0.029, col  test loss 150.700


Epoch 171: 272batch [00:18, 14.55batch/s, loss=941]


epoch 171: avg train loss 838.42, bar train loss 2.526, len train loss 0.027, col train loss 146.714


Epoch 172: 2batch [00:00, 14.49batch/s, loss=810]

epoch 171: avg test  loss 859.93, bar  test loss 2.657, len  test loss 0.027, col  test loss 150.550


Epoch 172: 272batch [00:18, 14.68batch/s, loss=832]


epoch 172: avg train loss 837.70, bar train loss 2.511, len train loss 0.026, col train loss 146.649


Epoch 173: 2batch [00:00, 14.93batch/s, loss=789]

epoch 172: avg test  loss 859.80, bar  test loss 2.657, len  test loss 0.029, col  test loss 150.503


Epoch 173: 272batch [00:18, 14.64batch/s, loss=878]


epoch 173: avg train loss 837.22, bar train loss 2.502, len train loss 0.026, col train loss 146.561


Epoch 174: 2batch [00:00, 14.49batch/s, loss=817]

epoch 173: avg test  loss 859.30, bar  test loss 2.660, len  test loss 0.027, col  test loss 150.522


Epoch 174: 272batch [00:18, 14.65batch/s, loss=881]


epoch 174: avg train loss 836.59, bar train loss 2.492, len train loss 0.025, col train loss 146.484


Epoch 175: 2batch [00:00, 14.60batch/s, loss=861]

epoch 174: avg test  loss 859.12, bar  test loss 2.653, len  test loss 0.028, col  test loss 150.432


Epoch 175: 272batch [00:18, 14.67batch/s, loss=866]


epoch 175: avg train loss 836.43, bar train loss 2.493, len train loss 0.026, col train loss 146.415
epoch 175: avg test  loss 858.76, bar  test loss 2.642, len  test loss 0.027, col  test loss 150.384


Epoch 176: 272batch [00:18, 14.44batch/s, loss=860]


epoch 176: avg train loss 835.69, bar train loss 2.482, len train loss 0.025, col train loss 146.311


Epoch 177: 2batch [00:00, 14.39batch/s, loss=831]

epoch 176: avg test  loss 858.75, bar  test loss 2.634, len  test loss 0.027, col  test loss 150.317


Epoch 177: 272batch [00:18, 14.71batch/s, loss=792]


epoch 177: avg train loss 835.26, bar train loss 2.476, len train loss 0.025, col train loss 146.229


Epoch 178: 2batch [00:00, 14.49batch/s, loss=796]

epoch 177: avg test  loss 858.30, bar  test loss 2.618, len  test loss 0.026, col  test loss 150.274


Epoch 178: 272batch [00:18, 14.40batch/s, loss=837]


epoch 178: avg train loss 834.89, bar train loss 2.468, len train loss 0.026, col train loss 146.165


Epoch 179: 2batch [00:00, 14.18batch/s, loss=809]

epoch 178: avg test  loss 857.55, bar  test loss 2.605, len  test loss 0.026, col  test loss 150.188


Epoch 179: 272batch [00:18, 14.35batch/s, loss=861]


epoch 179: avg train loss 834.35, bar train loss 2.456, len train loss 0.025, col train loss 146.091


Epoch 180: 2batch [00:00, 14.60batch/s, loss=797]

epoch 179: avg test  loss 857.60, bar  test loss 2.600, len  test loss 0.028, col  test loss 150.033


Epoch 180: 272batch [00:19, 14.31batch/s, loss=844]


epoch 180: avg train loss 833.87, bar train loss 2.452, len train loss 0.026, col train loss 146.011
epoch 180: avg test  loss 857.50, bar  test loss 2.592, len  test loss 0.030, col  test loss 150.134


Epoch 181: 272batch [00:19, 14.24batch/s, loss=837]


epoch 181: avg train loss 833.21, bar train loss 2.444, len train loss 0.025, col train loss 145.900


Epoch 182: 2batch [00:00, 14.29batch/s, loss=822]

epoch 181: avg test  loss 857.02, bar  test loss 2.625, len  test loss 0.027, col  test loss 150.109


Epoch 182: 272batch [00:18, 14.42batch/s, loss=863]


epoch 182: avg train loss 832.95, bar train loss 2.440, len train loss 0.025, col train loss 145.846


Epoch 183: 2batch [00:00, 14.71batch/s, loss=869]

epoch 182: avg test  loss 856.10, bar  test loss 2.591, len  test loss 0.026, col  test loss 150.060


Epoch 183: 272batch [00:18, 14.45batch/s, loss=820]


epoch 183: avg train loss 832.12, bar train loss 2.430, len train loss 0.026, col train loss 145.682


Epoch 184: 2batch [00:00, 14.60batch/s, loss=827]

epoch 183: avg test  loss 855.99, bar  test loss 2.592, len  test loss 0.026, col  test loss 149.905


Epoch 184: 272batch [00:18, 14.52batch/s, loss=839]


epoch 184: avg train loss 831.65, bar train loss 2.424, len train loss 0.026, col train loss 145.605


Epoch 185: 2batch [00:00, 14.49batch/s, loss=840]

epoch 184: avg test  loss 855.47, bar  test loss 2.571, len  test loss 0.027, col  test loss 149.750


Epoch 185: 272batch [00:18, 14.47batch/s, loss=818]


epoch 185: avg train loss 831.17, bar train loss 2.416, len train loss 0.025, col train loss 145.532
epoch 185: avg test  loss 855.29, bar  test loss 2.589, len  test loss 0.027, col  test loss 149.803


Epoch 186: 272batch [00:19, 14.20batch/s, loss=775]


epoch 186: avg train loss 830.69, bar train loss 2.410, len train loss 0.025, col train loss 145.441


Epoch 187: 2batch [00:00, 14.08batch/s, loss=847]

epoch 186: avg test  loss 854.77, bar  test loss 2.559, len  test loss 0.027, col  test loss 149.694


Epoch 187: 272batch [00:18, 14.51batch/s, loss=852]


epoch 187: avg train loss 830.17, bar train loss 2.401, len train loss 0.025, col train loss 145.386


Epoch 188: 2batch [00:00, 14.29batch/s, loss=804]

epoch 187: avg test  loss 854.90, bar  test loss 2.566, len  test loss 0.027, col  test loss 149.790


Epoch 188: 272batch [00:18, 14.49batch/s, loss=830]


epoch 188: avg train loss 829.76, bar train loss 2.398, len train loss 0.025, col train loss 145.289


Epoch 189: 2batch [00:00, 14.29batch/s, loss=864]

epoch 188: avg test  loss 854.27, bar  test loss 2.553, len  test loss 0.026, col  test loss 149.614


Epoch 189: 272batch [00:18, 14.51batch/s, loss=820]


epoch 189: avg train loss 829.28, bar train loss 2.388, len train loss 0.025, col train loss 145.220


Epoch 190: 2batch [00:00, 14.60batch/s, loss=856]

epoch 189: avg test  loss 853.90, bar  test loss 2.533, len  test loss 0.026, col  test loss 149.543


Epoch 190: 272batch [00:18, 14.48batch/s, loss=769]


epoch 190: avg train loss 828.88, bar train loss 2.386, len train loss 0.025, col train loss 145.134
epoch 190: avg test  loss 853.71, bar  test loss 2.577, len  test loss 0.028, col  test loss 149.657


Epoch 191: 272batch [00:18, 14.32batch/s, loss=817]


epoch 191: avg train loss 828.41, bar train loss 2.375, len train loss 0.025, col train loss 145.083


Epoch 192: 2batch [00:00, 13.89batch/s, loss=850]

epoch 191: avg test  loss 853.31, bar  test loss 2.538, len  test loss 0.028, col  test loss 149.436


Epoch 192: 272batch [00:18, 14.46batch/s, loss=775]


epoch 192: avg train loss 827.94, bar train loss 2.370, len train loss 0.025, col train loss 145.004


Epoch 193: 2batch [00:00, 14.71batch/s, loss=811]

epoch 192: avg test  loss 853.17, bar  test loss 2.539, len  test loss 0.027, col  test loss 149.498


Epoch 193: 272batch [00:18, 14.42batch/s, loss=866]


epoch 193: avg train loss 827.63, bar train loss 2.363, len train loss 0.025, col train loss 144.938


Epoch 194: 2batch [00:00, 14.60batch/s, loss=805]

epoch 193: avg test  loss 853.17, bar  test loss 2.513, len  test loss 0.026, col  test loss 149.457


Epoch 194: 272batch [00:18, 14.45batch/s, loss=964]


epoch 194: avg train loss 827.08, bar train loss 2.354, len train loss 0.025, col train loss 144.857


Epoch 195: 2batch [00:00, 14.29batch/s, loss=842]

epoch 194: avg test  loss 852.69, bar  test loss 2.537, len  test loss 0.030, col  test loss 149.405


Epoch 195: 272batch [00:18, 14.38batch/s, loss=787]


epoch 195: avg train loss 826.63, bar train loss 2.350, len train loss 0.025, col train loss 144.772
epoch 195: avg test  loss 852.39, bar  test loss 2.521, len  test loss 0.026, col  test loss 149.385


Epoch 196: 272batch [00:19, 14.29batch/s, loss=874]


epoch 196: avg train loss 826.22, bar train loss 2.344, len train loss 0.025, col train loss 144.720


Epoch 197: 2batch [00:00, 12.99batch/s, loss=807]

epoch 196: avg test  loss 852.15, bar  test loss 2.505, len  test loss 0.027, col  test loss 149.186


Epoch 197: 272batch [00:19, 14.22batch/s, loss=747]


epoch 197: avg train loss 825.78, bar train loss 2.340, len train loss 0.024, col train loss 144.622


Epoch 198: 2batch [00:00, 13.99batch/s, loss=809]

epoch 197: avg test  loss 851.56, bar  test loss 2.533, len  test loss 0.027, col  test loss 149.411


Epoch 198: 272batch [00:19, 14.26batch/s, loss=867]


epoch 198: avg train loss 825.36, bar train loss 2.332, len train loss 0.025, col train loss 144.560


Epoch 199: 2batch [00:00, 14.39batch/s, loss=805]

epoch 198: avg test  loss 851.67, bar  test loss 2.502, len  test loss 0.028, col  test loss 149.299


Epoch 199: 272batch [00:19, 14.30batch/s, loss=841]


epoch 199: avg train loss 825.01, bar train loss 2.330, len train loss 0.025, col train loss 144.481


Epoch 200: 2batch [00:00, 14.08batch/s, loss=822]

epoch 199: avg test  loss 851.47, bar  test loss 2.505, len  test loss 0.027, col  test loss 149.170


Epoch 200: 272batch [00:18, 14.48batch/s, loss=771]


epoch 200: avg train loss 824.60, bar train loss 2.325, len train loss 0.025, col train loss 144.404
epoch 200: avg test  loss 851.02, bar  test loss 2.488, len  test loss 0.027, col  test loss 149.113


Epoch 201: 272batch [00:19, 14.12batch/s, loss=849]


epoch 201: avg train loss 824.12, bar train loss 2.318, len train loss 0.025, col train loss 144.332


Epoch 202: 2batch [00:00, 14.60batch/s, loss=876]

epoch 201: avg test  loss 850.58, bar  test loss 2.492, len  test loss 0.025, col  test loss 149.053


Epoch 202: 272batch [00:18, 14.32batch/s, loss=741]


epoch 202: avg train loss 823.65, bar train loss 2.309, len train loss 0.025, col train loss 144.246


Epoch 203: 2batch [00:00, 14.49batch/s, loss=811]

epoch 202: avg test  loss 850.53, bar  test loss 2.482, len  test loss 0.029, col  test loss 149.092


Epoch 203: 272batch [00:18, 14.42batch/s, loss=778]


epoch 203: avg train loss 823.44, bar train loss 2.307, len train loss 0.024, col train loss 144.187


Epoch 204: 2batch [00:00, 14.08batch/s, loss=839]

epoch 203: avg test  loss 850.34, bar  test loss 2.501, len  test loss 0.026, col  test loss 148.987


Epoch 204: 272batch [00:18, 14.37batch/s, loss=903]


epoch 204: avg train loss 823.07, bar train loss 2.301, len train loss 0.025, col train loss 144.137


Epoch 205: 2batch [00:00, 14.29batch/s, loss=844]

epoch 204: avg test  loss 850.90, bar  test loss 2.463, len  test loss 0.029, col  test loss 148.957


Epoch 205: 272batch [00:18, 14.43batch/s, loss=831]


epoch 205: avg train loss 822.57, bar train loss 2.295, len train loss 0.024, col train loss 144.054
epoch 205: avg test  loss 850.06, bar  test loss 2.481, len  test loss 0.027, col  test loss 148.925


Epoch 206: 272batch [00:19, 14.22batch/s, loss=863]


epoch 206: avg train loss 822.24, bar train loss 2.295, len train loss 0.025, col train loss 143.992


Epoch 207: 2batch [00:00, 14.60batch/s, loss=822]

epoch 206: avg test  loss 850.09, bar  test loss 2.470, len  test loss 0.027, col  test loss 148.888


Epoch 207: 272batch [00:18, 14.39batch/s, loss=851]


epoch 207: avg train loss 821.88, bar train loss 2.287, len train loss 0.025, col train loss 143.921


Epoch 208: 2batch [00:00, 14.39batch/s, loss=822]

epoch 207: avg test  loss 849.77, bar  test loss 2.462, len  test loss 0.026, col  test loss 148.917


Epoch 208: 272batch [00:18, 14.43batch/s, loss=929]


epoch 208: avg train loss 821.47, bar train loss 2.282, len train loss 0.024, col train loss 143.857


Epoch 209: 2batch [00:00, 14.18batch/s, loss=812]

epoch 208: avg test  loss 849.69, bar  test loss 2.468, len  test loss 0.026, col  test loss 148.953


Epoch 209: 272batch [00:18, 14.42batch/s, loss=780]


epoch 209: avg train loss 821.08, bar train loss 2.278, len train loss 0.025, col train loss 143.774


Epoch 210: 2batch [00:00, 14.29batch/s, loss=832]

epoch 209: avg test  loss 849.11, bar  test loss 2.461, len  test loss 0.025, col  test loss 148.747


Epoch 210: 272batch [00:18, 14.50batch/s, loss=852]


epoch 210: avg train loss 820.65, bar train loss 2.272, len train loss 0.025, col train loss 143.701
epoch 210: avg test  loss 849.02, bar  test loss 2.450, len  test loss 0.025, col  test loss 148.795


Epoch 211: 272batch [00:19, 14.20batch/s, loss=828]


epoch 211: avg train loss 820.28, bar train loss 2.267, len train loss 0.025, col train loss 143.638


Epoch 212: 2batch [00:00, 14.49batch/s, loss=805]

epoch 211: avg test  loss 848.55, bar  test loss 2.467, len  test loss 0.026, col  test loss 148.716


Epoch 212: 272batch [00:18, 14.41batch/s, loss=845]


epoch 212: avg train loss 819.95, bar train loss 2.263, len train loss 0.024, col train loss 143.572


Epoch 213: 2batch [00:00, 14.49batch/s, loss=839]

epoch 212: avg test  loss 849.02, bar  test loss 2.455, len  test loss 0.028, col  test loss 148.720


Epoch 213: 272batch [00:18, 14.35batch/s, loss=822]


epoch 213: avg train loss 819.53, bar train loss 2.259, len train loss 0.024, col train loss 143.505


Epoch 214: 2batch [00:00, 14.29batch/s, loss=814]

epoch 213: avg test  loss 848.62, bar  test loss 2.451, len  test loss 0.028, col  test loss 148.739


Epoch 214: 272batch [00:18, 14.42batch/s, loss=858]


epoch 214: avg train loss 819.48, bar train loss 2.258, len train loss 0.025, col train loss 143.475


Epoch 215: 2batch [00:00, 14.18batch/s, loss=793]

epoch 214: avg test  loss 848.35, bar  test loss 2.440, len  test loss 0.026, col  test loss 148.528


Epoch 215: 272batch [00:18, 14.40batch/s, loss=875]


epoch 215: avg train loss 818.87, bar train loss 2.246, len train loss 0.024, col train loss 143.369
epoch 215: avg test  loss 848.61, bar  test loss 2.441, len  test loss 0.027, col  test loss 148.506


Epoch 216: 272batch [00:19, 14.15batch/s, loss=782]


epoch 216: avg train loss 818.68, bar train loss 2.245, len train loss 0.024, col train loss 143.334


Epoch 217: 2batch [00:00, 14.39batch/s, loss=818]

epoch 216: avg test  loss 848.10, bar  test loss 2.446, len  test loss 0.026, col  test loss 148.515


Epoch 217: 272batch [00:18, 14.42batch/s, loss=840]


epoch 217: avg train loss 818.04, bar train loss 2.241, len train loss 0.024, col train loss 143.224


Epoch 218: 2batch [00:00, 14.60batch/s, loss=792]

epoch 217: avg test  loss 847.84, bar  test loss 2.432, len  test loss 0.026, col  test loss 148.412


Epoch 218: 272batch [00:18, 14.43batch/s, loss=804]


epoch 218: avg train loss 817.94, bar train loss 2.237, len train loss 0.024, col train loss 143.194


Epoch 219: 2batch [00:00, 14.29batch/s, loss=832]

epoch 218: avg test  loss 847.80, bar  test loss 2.429, len  test loss 0.026, col  test loss 148.403


Epoch 219: 272batch [00:18, 14.40batch/s, loss=791]


epoch 219: avg train loss 817.43, bar train loss 2.232, len train loss 0.024, col train loss 143.111


Epoch 220: 2batch [00:00, 14.71batch/s, loss=806]

epoch 219: avg test  loss 847.39, bar  test loss 2.431, len  test loss 0.027, col  test loss 148.487


Epoch 220: 272batch [00:18, 14.45batch/s, loss=834]


epoch 220: avg train loss 817.11, bar train loss 2.228, len train loss 0.024, col train loss 143.047
epoch 220: avg test  loss 847.69, bar  test loss 2.429, len  test loss 0.026, col  test loss 148.434


Epoch 221: 272batch [00:19, 14.14batch/s, loss=852]


epoch 221: avg train loss 816.74, bar train loss 2.225, len train loss 0.024, col train loss 142.976
epoch 221: avg test  loss 847.08, bar  test loss 2.416, len  test loss 0.025, col  test loss 148.364


Epoch 222: 272batch [00:18, 14.40batch/s, loss=756]


epoch 222: avg train loss 816.37, bar train loss 2.220, len train loss 0.024, col train loss 142.902


Epoch 223: 2batch [00:00, 14.29batch/s, loss=836]

epoch 222: avg test  loss 847.16, bar  test loss 2.424, len  test loss 0.026, col  test loss 148.324


Epoch 223: 272batch [00:19, 14.17batch/s, loss=757]


epoch 223: avg train loss 816.19, bar train loss 2.215, len train loss 0.024, col train loss 142.876


Epoch 224: 2batch [00:00, 14.29batch/s, loss=786]

epoch 223: avg test  loss 846.73, bar  test loss 2.426, len  test loss 0.026, col  test loss 148.244


Epoch 224: 272batch [00:18, 14.34batch/s, loss=779]


epoch 224: avg train loss 815.93, bar train loss 2.213, len train loss 0.024, col train loss 142.803


Epoch 225: 2batch [00:00, 14.39batch/s, loss=807]

epoch 224: avg test  loss 846.70, bar  test loss 2.432, len  test loss 0.026, col  test loss 148.237


Epoch 225: 272batch [00:19, 14.28batch/s, loss=840]


epoch 225: avg train loss 815.54, bar train loss 2.208, len train loss 0.024, col train loss 142.738
epoch 225: avg test  loss 846.39, bar  test loss 2.399, len  test loss 0.026, col  test loss 148.224


Epoch 226: 272batch [00:19, 14.20batch/s, loss=798]


epoch 226: avg train loss 815.20, bar train loss 2.201, len train loss 0.024, col train loss 142.670


Epoch 227: 2batch [00:00, 14.39batch/s, loss=802]

epoch 226: avg test  loss 846.44, bar  test loss 2.405, len  test loss 0.026, col  test loss 148.265


Epoch 227: 272batch [00:18, 14.38batch/s, loss=796]


epoch 227: avg train loss 814.99, bar train loss 2.197, len train loss 0.025, col train loss 142.637


Epoch 228: 2batch [00:00, 14.49batch/s, loss=801]

epoch 227: avg test  loss 846.11, bar  test loss 2.406, len  test loss 0.026, col  test loss 148.194


Epoch 228: 272batch [00:18, 14.37batch/s, loss=884]


epoch 228: avg train loss 814.60, bar train loss 2.193, len train loss 0.024, col train loss 142.575


Epoch 229: 2batch [00:00, 14.49batch/s, loss=822]

epoch 228: avg test  loss 845.65, bar  test loss 2.393, len  test loss 0.026, col  test loss 148.136


Epoch 229: 272batch [00:18, 14.38batch/s, loss=883]


epoch 229: avg train loss 814.14, bar train loss 2.189, len train loss 0.024, col train loss 142.488


Epoch 230: 2batch [00:00, 14.60batch/s, loss=819]

epoch 229: avg test  loss 846.32, bar  test loss 2.379, len  test loss 0.027, col  test loss 148.095


Epoch 230: 272batch [00:18, 14.37batch/s, loss=809]


epoch 230: avg train loss 814.04, bar train loss 2.186, len train loss 0.025, col train loss 142.449
epoch 230: avg test  loss 845.67, bar  test loss 2.390, len  test loss 0.029, col  test loss 148.079


Epoch 231: 272batch [00:19, 13.90batch/s, loss=846]


epoch 231: avg train loss 813.53, bar train loss 2.181, len train loss 0.024, col train loss 142.366


Epoch 232: 2batch [00:00, 14.49batch/s, loss=806]

epoch 231: avg test  loss 845.35, bar  test loss 2.387, len  test loss 0.025, col  test loss 148.202


Epoch 232: 272batch [00:18, 14.32batch/s, loss=805]


epoch 232: avg train loss 813.25, bar train loss 2.173, len train loss 0.024, col train loss 142.339


Epoch 233: 2batch [00:00, 14.49batch/s, loss=797]

epoch 232: avg test  loss 845.69, bar  test loss 2.392, len  test loss 0.029, col  test loss 148.095


Epoch 233: 272batch [00:19, 14.30batch/s, loss=763]


epoch 233: avg train loss 812.80, bar train loss 2.173, len train loss 0.024, col train loss 142.236


Epoch 234: 2batch [00:00, 14.29batch/s, loss=812]

epoch 233: avg test  loss 845.43, bar  test loss 2.395, len  test loss 0.027, col  test loss 147.956


Epoch 234: 272batch [00:19, 14.30batch/s, loss=798]


epoch 234: avg train loss 812.44, bar train loss 2.168, len train loss 0.024, col train loss 142.159


Epoch 235: 2batch [00:00, 14.39batch/s, loss=801]

epoch 234: avg test  loss 844.82, bar  test loss 2.374, len  test loss 0.025, col  test loss 148.025


Epoch 235: 272batch [00:19, 14.31batch/s, loss=801]


epoch 235: avg train loss 812.38, bar train loss 2.164, len train loss 0.024, col train loss 142.125
epoch 235: avg test  loss 845.34, bar  test loss 2.365, len  test loss 0.026, col  test loss 147.984


Epoch 236: 272batch [00:19, 14.17batch/s, loss=800]


epoch 236: avg train loss 811.83, bar train loss 2.159, len train loss 0.024, col train loss 142.068


Epoch 237: 2batch [00:00, 13.79batch/s, loss=814]

epoch 236: avg test  loss 844.83, bar  test loss 2.374, len  test loss 0.026, col  test loss 147.934


Epoch 237: 272batch [00:18, 14.37batch/s, loss=806]


epoch 237: avg train loss 811.50, bar train loss 2.156, len train loss 0.024, col train loss 142.007


Epoch 238: 2batch [00:00, 14.08batch/s, loss=802]

epoch 237: avg test  loss 844.71, bar  test loss 2.365, len  test loss 0.026, col  test loss 147.917


Epoch 238: 272batch [00:18, 14.55batch/s, loss=791]


epoch 238: avg train loss 811.35, bar train loss 2.156, len train loss 0.024, col train loss 141.942


Epoch 239: 2batch [00:00, 14.18batch/s, loss=820]

epoch 238: avg test  loss 844.76, bar  test loss 2.357, len  test loss 0.026, col  test loss 147.795


Epoch 239: 272batch [00:18, 14.54batch/s, loss=804]


epoch 239: avg train loss 811.05, bar train loss 2.152, len train loss 0.024, col train loss 141.880


Epoch 240: 2batch [00:00, 14.29batch/s, loss=804]

epoch 239: avg test  loss 844.29, bar  test loss 2.360, len  test loss 0.025, col  test loss 147.829


Epoch 240: 272batch [00:18, 14.54batch/s, loss=803]


epoch 240: avg train loss 810.72, bar train loss 2.147, len train loss 0.024, col train loss 141.838
epoch 240: avg test  loss 844.62, bar  test loss 2.356, len  test loss 0.027, col  test loss 147.819


Epoch 241: 272batch [00:18, 14.37batch/s, loss=834]


epoch 241: avg train loss 810.38, bar train loss 2.144, len train loss 0.024, col train loss 141.771


Epoch 242: 2batch [00:00, 14.08batch/s, loss=802]

epoch 241: avg test  loss 844.43, bar  test loss 2.349, len  test loss 0.027, col  test loss 147.791


Epoch 242: 272batch [00:18, 14.56batch/s, loss=756]


epoch 242: avg train loss 809.98, bar train loss 2.141, len train loss 0.024, col train loss 141.681


Epoch 243: 2batch [00:00, 14.60batch/s, loss=817]

epoch 242: avg test  loss 844.18, bar  test loss 2.360, len  test loss 0.027, col  test loss 147.763


Epoch 243: 272batch [00:18, 14.53batch/s, loss=800]


epoch 243: avg train loss 809.79, bar train loss 2.135, len train loss 0.024, col train loss 141.650


Epoch 244: 2batch [00:00, 14.39batch/s, loss=841]

epoch 243: avg test  loss 843.93, bar  test loss 2.356, len  test loss 0.026, col  test loss 147.737


Epoch 244: 272batch [00:18, 14.51batch/s, loss=824]


epoch 244: avg train loss 809.34, bar train loss 2.132, len train loss 0.024, col train loss 141.562


Epoch 245: 2batch [00:00, 14.39batch/s, loss=839]

epoch 244: avg test  loss 844.02, bar  test loss 2.348, len  test loss 0.026, col  test loss 147.685


Epoch 245: 272batch [00:18, 14.48batch/s, loss=765]


epoch 245: avg train loss 809.34, bar train loss 2.129, len train loss 0.024, col train loss 141.548
epoch 245: avg test  loss 843.55, bar  test loss 2.338, len  test loss 0.026, col  test loss 147.602


Epoch 246: 272batch [00:19, 14.28batch/s, loss=789]


epoch 246: avg train loss 808.96, bar train loss 2.123, len train loss 0.023, col train loss 141.500


Epoch 247: 2batch [00:00, 14.29batch/s, loss=799]

epoch 246: avg test  loss 843.44, bar  test loss 2.341, len  test loss 0.026, col  test loss 147.655


Epoch 247: 272batch [00:18, 14.46batch/s, loss=768]


epoch 247: avg train loss 808.76, bar train loss 2.123, len train loss 0.023, col train loss 141.441


Epoch 248: 2batch [00:00, 14.60batch/s, loss=803]

epoch 247: avg test  loss 843.55, bar  test loss 2.339, len  test loss 0.026, col  test loss 147.697


Epoch 248: 272batch [00:18, 14.46batch/s, loss=965]


epoch 248: avg train loss 808.15, bar train loss 2.117, len train loss 0.024, col train loss 141.352


Epoch 249: 2batch [00:00, 14.18batch/s, loss=828]

epoch 248: avg test  loss 843.33, bar  test loss 2.337, len  test loss 0.026, col  test loss 147.615


Epoch 249: 272batch [00:18, 14.45batch/s, loss=770]


epoch 249: avg train loss 807.94, bar train loss 2.114, len train loss 0.024, col train loss 141.308


Epoch 250: 2batch [00:00, 14.29batch/s, loss=820]

epoch 249: avg test  loss 843.14, bar  test loss 2.328, len  test loss 0.026, col  test loss 147.569


Epoch 250: 272batch [00:18, 14.47batch/s, loss=762]


epoch 250: avg train loss 807.77, bar train loss 2.110, len train loss 0.024, col train loss 141.257
epoch 250: avg test  loss 843.51, bar  test loss 2.335, len  test loss 0.028, col  test loss 147.518


Epoch 251: 272batch [00:18, 14.33batch/s, loss=807]


epoch 251: avg train loss 807.42, bar train loss 2.108, len train loss 0.024, col train loss 141.181


Epoch 252: 2batch [00:00, 14.29batch/s, loss=774]

epoch 251: avg test  loss 842.97, bar  test loss 2.327, len  test loss 0.027, col  test loss 147.476


Epoch 252: 272batch [00:18, 14.46batch/s, loss=824]


epoch 252: avg train loss 807.01, bar train loss 2.100, len train loss 0.024, col train loss 141.125


Epoch 253: 2batch [00:00, 14.49batch/s, loss=827]

epoch 252: avg test  loss 842.85, bar  test loss 2.322, len  test loss 0.026, col  test loss 147.501


Epoch 253: 272batch [00:18, 14.44batch/s, loss=809]


epoch 253: avg train loss 806.83, bar train loss 2.097, len train loss 0.024, col train loss 141.079


Epoch 254: 2batch [00:00, 14.29batch/s, loss=798]

epoch 253: avg test  loss 842.71, bar  test loss 2.329, len  test loss 0.026, col  test loss 147.479


Epoch 254: 272batch [00:18, 14.46batch/s, loss=822]


epoch 254: avg train loss 806.54, bar train loss 2.097, len train loss 0.023, col train loss 141.033


Epoch 255: 2batch [00:00, 13.89batch/s, loss=794]

epoch 254: avg test  loss 842.28, bar  test loss 2.318, len  test loss 0.026, col  test loss 147.381


Epoch 255: 272batch [00:18, 14.46batch/s, loss=772]


epoch 255: avg train loss 806.24, bar train loss 2.090, len train loss 0.024, col train loss 140.975
epoch 255: avg test  loss 842.26, bar  test loss 2.344, len  test loss 0.027, col  test loss 147.434


Epoch 256: 272batch [00:19, 14.24batch/s, loss=844]


epoch 256: avg train loss 805.86, bar train loss 2.086, len train loss 0.023, col train loss 140.931


Epoch 257: 2batch [00:00, 14.93batch/s, loss=777]

epoch 256: avg test  loss 842.23, bar  test loss 2.329, len  test loss 0.026, col  test loss 147.390


Epoch 257: 272batch [00:18, 14.46batch/s, loss=754]


epoch 257: avg train loss 805.62, bar train loss 2.085, len train loss 0.023, col train loss 140.839


Epoch 258: 2batch [00:00, 14.60batch/s, loss=792]

epoch 257: avg test  loss 842.40, bar  test loss 2.315, len  test loss 0.028, col  test loss 147.437


Epoch 258: 272batch [00:18, 14.48batch/s, loss=855]


epoch 258: avg train loss 805.43, bar train loss 2.082, len train loss 0.024, col train loss 140.819


Epoch 259: 2batch [00:00, 14.29batch/s, loss=803]

epoch 258: avg test  loss 842.11, bar  test loss 2.317, len  test loss 0.026, col  test loss 147.349


Epoch 259: 272batch [00:18, 14.49batch/s, loss=839]


epoch 259: avg train loss 805.20, bar train loss 2.080, len train loss 0.024, col train loss 140.759


Epoch 260: 2batch [00:00, 14.60batch/s, loss=805]

epoch 259: avg test  loss 842.37, bar  test loss 2.307, len  test loss 0.026, col  test loss 147.401


Epoch 260: 272batch [00:18, 14.45batch/s, loss=791]


epoch 260: avg train loss 804.65, bar train loss 2.073, len train loss 0.023, col train loss 140.664
epoch 260: avg test  loss 841.98, bar  test loss 2.299, len  test loss 0.026, col  test loss 147.254


Epoch 261: 272batch [00:19, 14.25batch/s, loss=835]


epoch 261: avg train loss 804.47, bar train loss 2.071, len train loss 0.023, col train loss 140.633


Epoch 262: 2batch [00:00, 14.29batch/s, loss=797]

epoch 261: avg test  loss 841.97, bar  test loss 2.322, len  test loss 0.027, col  test loss 147.313


Epoch 262: 272batch [00:18, 14.45batch/s, loss=878]


epoch 262: avg train loss 804.10, bar train loss 2.066, len train loss 0.023, col train loss 140.581


Epoch 263: 2batch [00:00, 14.39batch/s, loss=791]

epoch 262: avg test  loss 842.10, bar  test loss 2.300, len  test loss 0.027, col  test loss 147.352


Epoch 263: 272batch [00:18, 14.43batch/s, loss=846]


epoch 263: avg train loss 803.92, bar train loss 2.066, len train loss 0.023, col train loss 140.523


Epoch 264: 2batch [00:00, 14.49batch/s, loss=836]

epoch 263: avg test  loss 841.33, bar  test loss 2.322, len  test loss 0.026, col  test loss 147.306


Epoch 264: 272batch [00:18, 14.40batch/s, loss=854]


epoch 264: avg train loss 803.50, bar train loss 2.061, len train loss 0.023, col train loss 140.446


Epoch 265: 2batch [00:00, 14.29batch/s, loss=786]

epoch 264: avg test  loss 841.82, bar  test loss 2.286, len  test loss 0.026, col  test loss 147.226


Epoch 265: 272batch [00:18, 14.42batch/s, loss=838]


epoch 265: avg train loss 803.33, bar train loss 2.056, len train loss 0.023, col train loss 140.406
epoch 265: avg test  loss 841.56, bar  test loss 2.288, len  test loss 0.026, col  test loss 147.174


Epoch 266: 272batch [00:19, 14.22batch/s, loss=862]


epoch 266: avg train loss 803.00, bar train loss 2.051, len train loss 0.023, col train loss 140.357


Epoch 267: 2batch [00:00, 14.49batch/s, loss=801]

epoch 266: avg test  loss 841.86, bar  test loss 2.286, len  test loss 0.029, col  test loss 147.191


Epoch 267: 272batch [00:18, 14.40batch/s, loss=762]


epoch 267: avg train loss 802.73, bar train loss 2.048, len train loss 0.023, col train loss 140.297


Epoch 268: 2batch [00:00, 14.29batch/s, loss=796]

epoch 267: avg test  loss 841.25, bar  test loss 2.295, len  test loss 0.025, col  test loss 147.173


Epoch 268: 272batch [00:18, 14.38batch/s, loss=829]


epoch 268: avg train loss 802.53, bar train loss 2.047, len train loss 0.023, col train loss 140.252


Epoch 269: 2batch [00:00, 14.08batch/s, loss=784]

epoch 268: avg test  loss 841.08, bar  test loss 2.281, len  test loss 0.026, col  test loss 147.117


Epoch 269: 272batch [00:18, 14.42batch/s, loss=794]


epoch 269: avg train loss 802.16, bar train loss 2.043, len train loss 0.023, col train loss 140.195


Epoch 270: 2batch [00:00, 14.29batch/s, loss=795]

epoch 269: avg test  loss 840.78, bar  test loss 2.283, len  test loss 0.027, col  test loss 147.173


Epoch 270: 272batch [00:18, 14.38batch/s, loss=821]


epoch 270: avg train loss 801.99, bar train loss 2.040, len train loss 0.023, col train loss 140.156
epoch 270: avg test  loss 841.02, bar  test loss 2.274, len  test loss 0.025, col  test loss 147.001


Epoch 271: 272batch [00:19, 14.21batch/s, loss=783]


epoch 271: avg train loss 801.48, bar train loss 2.036, len train loss 0.023, col train loss 140.074


Epoch 272: 2batch [00:00, 14.49batch/s, loss=776]

epoch 271: avg test  loss 840.88, bar  test loss 2.290, len  test loss 0.025, col  test loss 147.098


Epoch 272: 272batch [00:18, 14.41batch/s, loss=820]


epoch 272: avg train loss 801.39, bar train loss 2.032, len train loss 0.023, col train loss 140.041


Epoch 273: 2batch [00:00, 14.39batch/s, loss=824]

epoch 272: avg test  loss 840.63, bar  test loss 2.270, len  test loss 0.027, col  test loss 147.049


Epoch 273: 272batch [00:18, 14.41batch/s, loss=873]


epoch 273: avg train loss 801.03, bar train loss 2.033, len train loss 0.023, col train loss 139.965


Epoch 274: 2batch [00:00, 14.60batch/s, loss=807]

epoch 273: avg test  loss 839.92, bar  test loss 2.269, len  test loss 0.025, col  test loss 147.022


Epoch 274: 272batch [00:18, 14.42batch/s, loss=795]


epoch 274: avg train loss 800.71, bar train loss 2.026, len train loss 0.023, col train loss 139.908


Epoch 275: 2batch [00:00, 14.18batch/s, loss=826]

epoch 274: avg test  loss 839.92, bar  test loss 2.290, len  test loss 0.026, col  test loss 147.060


Epoch 275: 272batch [00:18, 14.41batch/s, loss=887]


epoch 275: avg train loss 800.55, bar train loss 2.025, len train loss 0.023, col train loss 139.884
epoch 275: avg test  loss 840.35, bar  test loss 2.268, len  test loss 0.026, col  test loss 146.947


Epoch 276: 272batch [00:19, 14.19batch/s, loss=835]


epoch 276: avg train loss 800.36, bar train loss 2.022, len train loss 0.023, col train loss 139.847


Epoch 277: 2batch [00:00, 14.29batch/s, loss=800]

epoch 276: avg test  loss 840.21, bar  test loss 2.246, len  test loss 0.025, col  test loss 146.898


Epoch 277: 272batch [00:18, 14.40batch/s, loss=825]


epoch 277: avg train loss 800.05, bar train loss 2.018, len train loss 0.023, col train loss 139.794


Epoch 278: 2batch [00:00, 14.18batch/s, loss=790]

epoch 277: avg test  loss 840.57, bar  test loss 2.269, len  test loss 0.026, col  test loss 146.913


Epoch 278: 272batch [00:18, 14.40batch/s, loss=800]


epoch 278: avg train loss 799.70, bar train loss 2.014, len train loss 0.023, col train loss 139.720


Epoch 279: 2batch [00:00, 14.18batch/s, loss=830]

epoch 278: avg test  loss 840.15, bar  test loss 2.267, len  test loss 0.027, col  test loss 146.842


Epoch 279: 272batch [00:18, 14.39batch/s, loss=802]


epoch 279: avg train loss 799.53, bar train loss 2.013, len train loss 0.023, col train loss 139.681


Epoch 280: 2batch [00:00, 13.79batch/s, loss=816]

epoch 279: avg test  loss 839.84, bar  test loss 2.261, len  test loss 0.025, col  test loss 146.960


Epoch 280: 272batch [00:18, 14.35batch/s, loss=795]


epoch 280: avg train loss 799.12, bar train loss 2.008, len train loss 0.023, col train loss 139.611
epoch 280: avg test  loss 840.36, bar  test loss 2.239, len  test loss 0.026, col  test loss 146.866


Epoch 281: 272batch [00:19, 14.18batch/s, loss=763]


epoch 281: avg train loss 798.98, bar train loss 2.004, len train loss 0.023, col train loss 139.562


Epoch 282: 2batch [00:00, 14.18batch/s, loss=783]

epoch 281: avg test  loss 839.80, bar  test loss 2.266, len  test loss 0.025, col  test loss 146.835


Epoch 282: 272batch [00:18, 14.36batch/s, loss=765]


epoch 282: avg train loss 798.42, bar train loss 2.003, len train loss 0.023, col train loss 139.479


Epoch 283: 2batch [00:00, 14.29batch/s, loss=793]

epoch 282: avg test  loss 840.33, bar  test loss 2.260, len  test loss 0.025, col  test loss 146.822


Epoch 283: 272batch [00:18, 14.39batch/s, loss=776]


epoch 283: avg train loss 798.29, bar train loss 1.999, len train loss 0.023, col train loss 139.447


Epoch 284: 2batch [00:00, 13.99batch/s, loss=787]

epoch 283: avg test  loss 839.44, bar  test loss 2.270, len  test loss 0.026, col  test loss 146.833


Epoch 284: 272batch [00:18, 14.37batch/s, loss=788]


epoch 284: avg train loss 798.04, bar train loss 1.995, len train loss 0.023, col train loss 139.399


Epoch 285: 2batch [00:00, 14.39batch/s, loss=776]

epoch 284: avg test  loss 840.38, bar  test loss 2.270, len  test loss 0.034, col  test loss 146.895


Epoch 285: 272batch [00:18, 14.36batch/s, loss=751]


epoch 285: avg train loss 797.93, bar train loss 1.995, len train loss 0.023, col train loss 139.386
epoch 285: avg test  loss 839.95, bar  test loss 2.252, len  test loss 0.025, col  test loss 146.806


Epoch 286: 272batch [00:19, 14.13batch/s, loss=878]


epoch 286: avg train loss 797.48, bar train loss 1.991, len train loss 0.023, col train loss 139.291


Epoch 287: 2batch [00:00, 14.29batch/s, loss=776]

epoch 286: avg test  loss 839.93, bar  test loss 2.263, len  test loss 0.026, col  test loss 146.832


Epoch 287: 272batch [00:18, 14.38batch/s, loss=807]


epoch 287: avg train loss 797.14, bar train loss 1.986, len train loss 0.022, col train loss 139.246


Epoch 288: 2batch [00:00, 13.99batch/s, loss=801]

epoch 287: avg test  loss 839.58, bar  test loss 2.243, len  test loss 0.026, col  test loss 146.743


Epoch 288: 272batch [00:18, 14.36batch/s, loss=836]


epoch 288: avg train loss 797.08, bar train loss 1.986, len train loss 0.023, col train loss 139.191


Epoch 289: 2batch [00:00, 14.39batch/s, loss=802]

epoch 288: avg test  loss 839.20, bar  test loss 2.246, len  test loss 0.026, col  test loss 146.774


Epoch 289: 272batch [00:18, 14.37batch/s, loss=811]


epoch 289: avg train loss 796.91, bar train loss 1.981, len train loss 0.023, col train loss 139.171


Epoch 290: 2batch [00:00, 14.39batch/s, loss=801]

epoch 289: avg test  loss 839.26, bar  test loss 2.229, len  test loss 0.026, col  test loss 146.650


Epoch 290: 272batch [00:18, 14.36batch/s, loss=777]


epoch 290: avg train loss 796.57, bar train loss 1.979, len train loss 0.023, col train loss 139.112
epoch 290: avg test  loss 838.94, bar  test loss 2.243, len  test loss 0.026, col  test loss 146.749


Epoch 291: 272batch [00:19, 14.05batch/s, loss=860]


epoch 291: avg train loss 796.43, bar train loss 1.979, len train loss 0.023, col train loss 139.062


Epoch 292: 2batch [00:00, 14.08batch/s, loss=746]

epoch 291: avg test  loss 839.03, bar  test loss 2.242, len  test loss 0.025, col  test loss 146.698


Epoch 292: 272batch [00:18, 14.34batch/s, loss=855]


epoch 292: avg train loss 796.14, bar train loss 1.975, len train loss 0.023, col train loss 139.015


Epoch 293: 2batch [00:00, 13.89batch/s, loss=782]

epoch 292: avg test  loss 839.12, bar  test loss 2.241, len  test loss 0.028, col  test loss 146.666


Epoch 293: 272batch [00:18, 14.39batch/s, loss=852]


epoch 293: avg train loss 795.94, bar train loss 1.967, len train loss 0.023, col train loss 138.988


Epoch 294: 2batch [00:00, 14.29batch/s, loss=798]

epoch 293: avg test  loss 839.00, bar  test loss 2.229, len  test loss 0.026, col  test loss 146.585


Epoch 294: 272batch [00:18, 14.34batch/s, loss=846]


epoch 294: avg train loss 795.59, bar train loss 1.968, len train loss 0.023, col train loss 138.905


Epoch 295: 2batch [00:00, 14.29batch/s, loss=779]

epoch 294: avg test  loss 838.98, bar  test loss 2.226, len  test loss 0.025, col  test loss 146.608


Epoch 295: 272batch [00:19, 14.28batch/s, loss=842]


epoch 295: avg train loss 795.36, bar train loss 1.966, len train loss 0.023, col train loss 138.861
epoch 295: avg test  loss 839.12, bar  test loss 2.219, len  test loss 0.027, col  test loss 146.589


Epoch 296: 272batch [00:19, 13.90batch/s, loss=764]


epoch 296: avg train loss 795.15, bar train loss 1.966, len train loss 0.023, col train loss 138.805


Epoch 297: 2batch [00:00, 14.29batch/s, loss=781]

epoch 296: avg test  loss 838.77, bar  test loss 2.243, len  test loss 0.026, col  test loss 146.676


Epoch 297: 272batch [00:18, 14.33batch/s, loss=801]


epoch 297: avg train loss 794.87, bar train loss 1.960, len train loss 0.023, col train loss 138.773


Epoch 298: 2batch [00:00, 14.18batch/s, loss=830]

epoch 297: avg test  loss 839.50, bar  test loss 2.217, len  test loss 0.028, col  test loss 146.535


Epoch 298: 272batch [00:18, 14.35batch/s, loss=811]


epoch 298: avg train loss 794.62, bar train loss 1.961, len train loss 0.023, col train loss 138.707


Epoch 299: 2batch [00:00, 13.99batch/s, loss=803]

epoch 298: avg test  loss 838.78, bar  test loss 2.241, len  test loss 0.025, col  test loss 146.691


Epoch 299: 272batch [00:18, 14.32batch/s, loss=771]


epoch 299: avg train loss 794.53, bar train loss 1.957, len train loss 0.022, col train loss 138.709


Epoch 300: 2batch [00:00, 13.79batch/s, loss=777]

epoch 299: avg test  loss 838.68, bar  test loss 2.235, len  test loss 0.025, col  test loss 146.542


Epoch 300: 272batch [00:18, 14.32batch/s, loss=761]


epoch 300: avg train loss 794.14, bar train loss 1.954, len train loss 0.023, col train loss 138.615
epoch 300: avg test  loss 838.33, bar  test loss 2.214, len  test loss 0.025, col  test loss 146.534


Epoch 301: 272batch [00:19, 14.17batch/s, loss=817]


epoch 301: avg train loss 793.79, bar train loss 1.951, len train loss 0.023, col train loss 138.549


Epoch 302: 2batch [00:00, 14.39batch/s, loss=795]

epoch 301: avg test  loss 838.34, bar  test loss 2.232, len  test loss 0.025, col  test loss 146.556


Epoch 302: 272batch [00:18, 14.33batch/s, loss=799]


epoch 302: avg train loss 793.64, bar train loss 1.949, len train loss 0.022, col train loss 138.510


Epoch 303: 2batch [00:00, 14.49batch/s, loss=773]

epoch 302: avg test  loss 838.35, bar  test loss 2.229, len  test loss 0.026, col  test loss 146.566


Epoch 303: 272batch [00:18, 14.36batch/s, loss=782]


epoch 303: avg train loss 793.51, bar train loss 1.949, len train loss 0.022, col train loss 138.481


Epoch 304: 2batch [00:00, 14.39batch/s, loss=783]

epoch 303: avg test  loss 837.83, bar  test loss 2.227, len  test loss 0.026, col  test loss 146.526


Epoch 304: 272batch [00:19, 14.29batch/s, loss=833]


epoch 304: avg train loss 793.32, bar train loss 1.947, len train loss 0.022, col train loss 138.441


Epoch 305: 2batch [00:00, 14.39batch/s, loss=770]

epoch 304: avg test  loss 838.90, bar  test loss 2.226, len  test loss 0.027, col  test loss 146.389


Epoch 305: 272batch [00:18, 14.32batch/s, loss=829]


epoch 305: avg train loss 793.11, bar train loss 1.942, len train loss 0.023, col train loss 138.395
epoch 305: avg test  loss 838.11, bar  test loss 2.214, len  test loss 0.027, col  test loss 146.439


Epoch 306: 272batch [00:19, 14.09batch/s, loss=798]


epoch 306: avg train loss 792.70, bar train loss 1.938, len train loss 0.023, col train loss 138.306


Epoch 307: 2batch [00:00, 14.08batch/s, loss=798]

epoch 306: avg test  loss 838.25, bar  test loss 2.217, len  test loss 0.025, col  test loss 146.491


Epoch 307: 272batch [00:18, 14.35batch/s, loss=854]


epoch 307: avg train loss 792.43, bar train loss 1.937, len train loss 0.022, col train loss 138.273


Epoch 308: 2batch [00:00, 14.49batch/s, loss=831]

epoch 307: avg test  loss 838.10, bar  test loss 2.209, len  test loss 0.027, col  test loss 146.419


Epoch 308: 272batch [00:19, 14.29batch/s, loss=749]


epoch 308: avg train loss 792.35, bar train loss 1.935, len train loss 0.023, col train loss 138.239


Epoch 309: 2batch [00:00, 14.18batch/s, loss=804]

epoch 308: avg test  loss 838.18, bar  test loss 2.212, len  test loss 0.025, col  test loss 146.382


Epoch 309: 272batch [00:19, 14.29batch/s, loss=753]


epoch 309: avg train loss 792.15, bar train loss 1.932, len train loss 0.023, col train loss 138.205


Epoch 310: 2batch [00:00, 14.18batch/s, loss=785]

epoch 309: avg test  loss 837.82, bar  test loss 2.215, len  test loss 0.025, col  test loss 146.417


Epoch 310: 272batch [00:19, 14.28batch/s, loss=799]


epoch 310: avg train loss 791.91, bar train loss 1.932, len train loss 0.022, col train loss 138.157
epoch 310: avg test  loss 838.33, bar  test loss 2.211, len  test loss 0.030, col  test loss 146.431


Epoch 311: 272batch [00:19, 14.09batch/s, loss=692]


epoch 311: avg train loss 791.54, bar train loss 1.928, len train loss 0.022, col train loss 138.080


Epoch 312: 2batch [00:00, 14.39batch/s, loss=765]

epoch 311: avg test  loss 837.83, bar  test loss 2.206, len  test loss 0.025, col  test loss 146.365


Epoch 312: 272batch [00:18, 14.32batch/s, loss=803]


epoch 312: avg train loss 791.36, bar train loss 1.921, len train loss 0.022, col train loss 138.065


Epoch 313: 2batch [00:00, 13.89batch/s, loss=767]

epoch 312: avg test  loss 837.73, bar  test loss 2.196, len  test loss 0.025, col  test loss 146.370


Epoch 313: 272batch [00:18, 14.32batch/s, loss=789]


epoch 313: avg train loss 791.14, bar train loss 1.923, len train loss 0.022, col train loss 137.993


Epoch 314: 2batch [00:00, 13.99batch/s, loss=767]

epoch 313: avg test  loss 838.04, bar  test loss 2.205, len  test loss 0.029, col  test loss 146.337


Epoch 314: 272batch [00:19, 14.31batch/s, loss=745]


epoch 314: avg train loss 790.96, bar train loss 1.923, len train loss 0.022, col train loss 137.953


Epoch 315: 2batch [00:00, 13.89batch/s, loss=793]

epoch 314: avg test  loss 837.58, bar  test loss 2.205, len  test loss 0.026, col  test loss 146.381


Epoch 315: 272batch [00:18, 14.32batch/s, loss=757]


epoch 315: avg train loss 790.61, bar train loss 1.919, len train loss 0.022, col train loss 137.905
epoch 315: avg test  loss 838.24, bar  test loss 2.202, len  test loss 0.026, col  test loss 146.294


Epoch 316: 272batch [00:19, 14.09batch/s, loss=783]


epoch 316: avg train loss 790.44, bar train loss 1.918, len train loss 0.022, col train loss 137.853


Epoch 317: 2batch [00:00, 13.25batch/s, loss=764]

epoch 316: avg test  loss 837.81, bar  test loss 2.206, len  test loss 0.026, col  test loss 146.308


Epoch 317: 272batch [00:19, 14.28batch/s, loss=795]


epoch 317: avg train loss 790.24, bar train loss 1.917, len train loss 0.022, col train loss 137.804


Epoch 318: 2batch [00:00, 14.49batch/s, loss=786]

epoch 317: avg test  loss 837.62, bar  test loss 2.201, len  test loss 0.027, col  test loss 146.260


Epoch 318: 272batch [00:18, 14.34batch/s, loss=843]


epoch 318: avg train loss 790.12, bar train loss 1.917, len train loss 0.023, col train loss 137.773


Epoch 319: 2batch [00:00, 14.39batch/s, loss=790]

epoch 318: avg test  loss 837.61, bar  test loss 2.205, len  test loss 0.026, col  test loss 146.258


Epoch 319: 272batch [00:18, 14.33batch/s, loss=832]


epoch 319: avg train loss 789.93, bar train loss 1.914, len train loss 0.022, col train loss 137.743


Epoch 320: 2batch [00:00, 14.29batch/s, loss=762]

epoch 319: avg test  loss 837.92, bar  test loss 2.187, len  test loss 0.026, col  test loss 146.298


Epoch 320: 272batch [00:19, 14.30batch/s, loss=750]


epoch 320: avg train loss 789.53, bar train loss 1.909, len train loss 0.023, col train loss 137.658
epoch 320: avg test  loss 837.43, bar  test loss 2.197, len  test loss 0.027, col  test loss 146.192


Epoch 321: 272batch [00:20, 13.55batch/s, loss=757]


epoch 321: avg train loss 789.44, bar train loss 1.907, len train loss 0.022, col train loss 137.617


Epoch 322: 2batch [00:00, 14.29batch/s, loss=811]

epoch 321: avg test  loss 837.55, bar  test loss 2.213, len  test loss 0.027, col  test loss 146.340


Epoch 322: 272batch [00:19, 14.27batch/s, loss=881]


epoch 322: avg train loss 789.17, bar train loss 1.908, len train loss 0.022, col train loss 137.567


Epoch 323: 2batch [00:00, 14.18batch/s, loss=809]

epoch 322: avg test  loss 837.69, bar  test loss 2.204, len  test loss 0.026, col  test loss 146.257


Epoch 323: 272batch [00:19, 14.28batch/s, loss=807]


epoch 323: avg train loss 789.11, bar train loss 1.903, len train loss 0.022, col train loss 137.565


Epoch 324: 2batch [00:00, 14.18batch/s, loss=773]

epoch 323: avg test  loss 837.40, bar  test loss 2.198, len  test loss 0.026, col  test loss 146.128


Epoch 324: 272batch [00:19, 14.30batch/s, loss=755]


epoch 324: avg train loss 788.69, bar train loss 1.901, len train loss 0.022, col train loss 137.493


Epoch 325: 2batch [00:00, 13.99batch/s, loss=779]

epoch 324: avg test  loss 836.87, bar  test loss 2.195, len  test loss 0.026, col  test loss 146.195


Epoch 325: 272batch [00:19, 14.30batch/s, loss=832]


epoch 325: avg train loss 788.68, bar train loss 1.896, len train loss 0.023, col train loss 137.471
epoch 325: avg test  loss 837.64, bar  test loss 2.196, len  test loss 0.026, col  test loss 146.206


Epoch 326: 272batch [00:19, 14.15batch/s, loss=750]


epoch 326: avg train loss 788.35, bar train loss 1.897, len train loss 0.022, col train loss 137.401


Epoch 327: 2batch [00:00, 14.39batch/s, loss=761]

epoch 326: avg test  loss 837.45, bar  test loss 2.193, len  test loss 0.027, col  test loss 146.186


Epoch 327: 272batch [00:19, 14.30batch/s, loss=709]


epoch 327: avg train loss 788.18, bar train loss 1.895, len train loss 0.022, col train loss 137.381


Epoch 328: 2batch [00:00, 14.39batch/s, loss=771]

epoch 327: avg test  loss 837.23, bar  test loss 2.192, len  test loss 0.025, col  test loss 146.159


Epoch 328: 272batch [00:19, 14.28batch/s, loss=791]


epoch 328: avg train loss 787.91, bar train loss 1.895, len train loss 0.022, col train loss 137.319


Epoch 329: 2batch [00:00, 14.29batch/s, loss=772]

epoch 328: avg test  loss 837.05, bar  test loss 2.178, len  test loss 0.025, col  test loss 146.176


Epoch 329: 272batch [00:19, 14.28batch/s, loss=787]


epoch 329: avg train loss 787.82, bar train loss 1.889, len train loss 0.022, col train loss 137.297


Epoch 330: 2batch [00:00, 14.39batch/s, loss=799]

epoch 329: avg test  loss 836.92, bar  test loss 2.198, len  test loss 0.028, col  test loss 146.109


Epoch 330: 272batch [00:19, 14.27batch/s, loss=727]


epoch 330: avg train loss 787.48, bar train loss 1.890, len train loss 0.022, col train loss 137.221
epoch 330: avg test  loss 837.51, bar  test loss 2.185, len  test loss 0.027, col  test loss 146.080


Epoch 331: 272batch [00:19, 14.05batch/s, loss=865]


epoch 331: avg train loss 787.37, bar train loss 1.890, len train loss 0.022, col train loss 137.200


Epoch 332: 2batch [00:00, 13.79batch/s, loss=801]

epoch 331: avg test  loss 837.20, bar  test loss 2.193, len  test loss 0.027, col  test loss 146.063


Epoch 332: 272batch [00:19, 14.26batch/s, loss=765]


epoch 332: avg train loss 787.12, bar train loss 1.883, len train loss 0.022, col train loss 137.133


Epoch 333: 2batch [00:00, 14.60batch/s, loss=824]

epoch 332: avg test  loss 836.87, bar  test loss 2.201, len  test loss 0.027, col  test loss 146.098


Epoch 333: 272batch [00:19, 14.27batch/s, loss=819]


epoch 333: avg train loss 786.86, bar train loss 1.886, len train loss 0.022, col train loss 137.095


Epoch 334: 2batch [00:00, 14.18batch/s, loss=808]

epoch 333: avg test  loss 836.98, bar  test loss 2.182, len  test loss 0.026, col  test loss 146.048


Epoch 334: 272batch [00:19, 14.26batch/s, loss=820]


epoch 334: avg train loss 786.68, bar train loss 1.881, len train loss 0.022, col train loss 137.036


Epoch 335: 2batch [00:00, 13.99batch/s, loss=772]

epoch 334: avg test  loss 836.98, bar  test loss 2.203, len  test loss 0.027, col  test loss 146.132


Epoch 335: 272batch [00:19, 14.19batch/s, loss=769]


epoch 335: avg train loss 786.51, bar train loss 1.876, len train loss 0.022, col train loss 137.010
epoch 335: avg test  loss 837.17, bar  test loss 2.168, len  test loss 0.025, col  test loss 145.904


Epoch 336: 272batch [00:19, 13.81batch/s, loss=800]


epoch 336: avg train loss 786.32, bar train loss 1.877, len train loss 0.022, col train loss 136.965


Epoch 337: 2batch [00:00, 14.18batch/s, loss=806]

epoch 336: avg test  loss 836.93, bar  test loss 2.161, len  test loss 0.026, col  test loss 146.025


Epoch 337: 272batch [00:19, 14.20batch/s, loss=814]


epoch 337: avg train loss 786.04, bar train loss 1.874, len train loss 0.022, col train loss 136.911


Epoch 338: 2batch [00:00, 13.99batch/s, loss=814]

epoch 337: avg test  loss 836.66, bar  test loss 2.191, len  test loss 0.027, col  test loss 146.114


Epoch 338: 272batch [00:19, 14.24batch/s, loss=852]


epoch 338: avg train loss 785.97, bar train loss 1.874, len train loss 0.022, col train loss 136.897


Epoch 339: 2batch [00:00, 13.70batch/s, loss=766]

epoch 338: avg test  loss 836.64, bar  test loss 2.177, len  test loss 0.025, col  test loss 145.949


Epoch 339: 272batch [00:19, 14.21batch/s, loss=768]


epoch 339: avg train loss 785.57, bar train loss 1.871, len train loss 0.022, col train loss 136.820


Epoch 340: 2batch [00:00, 13.70batch/s, loss=783]

epoch 339: avg test  loss 836.84, bar  test loss 2.178, len  test loss 0.027, col  test loss 145.956


Epoch 340: 272batch [00:19, 14.17batch/s, loss=823]


epoch 340: avg train loss 785.55, bar train loss 1.872, len train loss 0.022, col train loss 136.789
epoch 340: avg test  loss 836.82, bar  test loss 2.182, len  test loss 0.025, col  test loss 145.880


Epoch 341: 272batch [00:19, 13.75batch/s, loss=748]


epoch 341: avg train loss 785.19, bar train loss 1.868, len train loss 0.022, col train loss 136.732


Epoch 342: 2batch [00:00, 14.49batch/s, loss=791]

epoch 341: avg test  loss 836.50, bar  test loss 2.173, len  test loss 0.026, col  test loss 145.971


Epoch 342: 272batch [00:19, 14.27batch/s, loss=789]


epoch 342: avg train loss 784.93, bar train loss 1.867, len train loss 0.022, col train loss 136.679


Epoch 343: 2batch [00:00, 13.89batch/s, loss=798]

epoch 342: avg test  loss 836.48, bar  test loss 2.180, len  test loss 0.025, col  test loss 145.905


Epoch 343: 272batch [00:19, 14.25batch/s, loss=797]


epoch 343: avg train loss 784.79, bar train loss 1.863, len train loss 0.022, col train loss 136.633


Epoch 344: 2batch [00:00, 14.08batch/s, loss=736]

epoch 343: avg test  loss 836.04, bar  test loss 2.178, len  test loss 0.025, col  test loss 145.901


Epoch 344: 272batch [00:19, 14.24batch/s, loss=810]


epoch 344: avg train loss 784.53, bar train loss 1.864, len train loss 0.022, col train loss 136.582


Epoch 345: 2batch [00:00, 13.51batch/s, loss=751]

epoch 344: avg test  loss 835.99, bar  test loss 2.177, len  test loss 0.025, col  test loss 145.820


Epoch 345: 272batch [00:19, 14.24batch/s, loss=832]


epoch 345: avg train loss 784.46, bar train loss 1.864, len train loss 0.022, col train loss 136.560
epoch 345: avg test  loss 836.20, bar  test loss 2.162, len  test loss 0.026, col  test loss 145.884


Epoch 346: 272batch [00:19, 13.92batch/s, loss=792]


epoch 346: avg train loss 784.35, bar train loss 1.860, len train loss 0.022, col train loss 136.532


Epoch 347: 2batch [00:00, 14.29batch/s, loss=818]

epoch 346: avg test  loss 836.26, bar  test loss 2.174, len  test loss 0.026, col  test loss 145.834


Epoch 347: 272batch [00:19, 14.23batch/s, loss=831]


epoch 347: avg train loss 783.94, bar train loss 1.855, len train loss 0.022, col train loss 136.469


Epoch 348: 2batch [00:00, 14.49batch/s, loss=797]

epoch 347: avg test  loss 836.22, bar  test loss 2.166, len  test loss 0.025, col  test loss 145.821


Epoch 348: 272batch [00:19, 14.19batch/s, loss=841]


epoch 348: avg train loss 783.77, bar train loss 1.854, len train loss 0.022, col train loss 136.439


Epoch 349: 2batch [00:00, 13.89batch/s, loss=778]

epoch 348: avg test  loss 836.56, bar  test loss 2.162, len  test loss 0.025, col  test loss 145.803


Epoch 349: 272batch [00:19, 14.22batch/s, loss=741]


epoch 349: avg train loss 783.55, bar train loss 1.851, len train loss 0.022, col train loss 136.372


Epoch 350: 2batch [00:00, 14.60batch/s, loss=776]

epoch 349: avg test  loss 836.55, bar  test loss 2.158, len  test loss 0.027, col  test loss 145.742


Epoch 350: 272batch [00:19, 14.25batch/s, loss=819]


epoch 350: avg train loss 783.41, bar train loss 1.850, len train loss 0.022, col train loss 136.357
epoch 350: avg test  loss 836.36, bar  test loss 2.167, len  test loss 0.025, col  test loss 145.773


Epoch 351: 272batch [00:19, 13.98batch/s, loss=771]


epoch 351: avg train loss 783.29, bar train loss 1.850, len train loss 0.022, col train loss 136.306


Epoch 352: 2batch [00:00, 14.29batch/s, loss=758]

epoch 351: avg test  loss 836.46, bar  test loss 2.163, len  test loss 0.030, col  test loss 145.682


Epoch 352: 272batch [00:19, 14.24batch/s, loss=769]


epoch 352: avg train loss 782.98, bar train loss 1.848, len train loss 0.022, col train loss 136.247


Epoch 353: 2batch [00:00, 13.89batch/s, loss=791]

epoch 352: avg test  loss 836.44, bar  test loss 2.182, len  test loss 0.030, col  test loss 145.795


Epoch 353: 272batch [00:19, 14.24batch/s, loss=765]


epoch 353: avg train loss 782.73, bar train loss 1.844, len train loss 0.022, col train loss 136.192


Epoch 354: 2batch [00:00, 14.29batch/s, loss=770]

epoch 353: avg test  loss 836.33, bar  test loss 2.171, len  test loss 0.026, col  test loss 145.829


Epoch 354: 272batch [00:19, 14.22batch/s, loss=792]


epoch 354: avg train loss 782.54, bar train loss 1.844, len train loss 0.022, col train loss 136.158


Epoch 355: 2batch [00:00, 13.89batch/s, loss=818]

epoch 354: avg test  loss 835.78, bar  test loss 2.169, len  test loss 0.025, col  test loss 145.674


Epoch 355: 272batch [00:19, 14.20batch/s, loss=729]


epoch 355: avg train loss 782.35, bar train loss 1.839, len train loss 0.022, col train loss 136.131
epoch 355: avg test  loss 836.13, bar  test loss 2.146, len  test loss 0.026, col  test loss 145.757


Epoch 356: 272batch [00:19, 13.97batch/s, loss=726]


epoch 356: avg train loss 782.19, bar train loss 1.838, len train loss 0.022, col train loss 136.092


Epoch 357: 2batch [00:00, 13.79batch/s, loss=767]

epoch 356: avg test  loss 836.00, bar  test loss 2.161, len  test loss 0.026, col  test loss 145.595


Epoch 357: 272batch [00:19, 14.24batch/s, loss=818]


epoch 357: avg train loss 781.84, bar train loss 1.837, len train loss 0.022, col train loss 136.021


Epoch 358: 2batch [00:00, 14.49batch/s, loss=765]

epoch 357: avg test  loss 836.32, bar  test loss 2.179, len  test loss 0.027, col  test loss 145.658


Epoch 358: 272batch [00:19, 14.22batch/s, loss=720]


epoch 358: avg train loss 781.65, bar train loss 1.839, len train loss 0.022, col train loss 135.957


Epoch 359: 2batch [00:00, 14.29batch/s, loss=795]

epoch 358: avg test  loss 836.00, bar  test loss 2.152, len  test loss 0.028, col  test loss 145.665


Epoch 359: 272batch [00:19, 14.19batch/s, loss=820]


epoch 359: avg train loss 781.51, bar train loss 1.833, len train loss 0.022, col train loss 135.950


Epoch 360: 2batch [00:00, 13.70batch/s, loss=782]

epoch 359: avg test  loss 835.36, bar  test loss 2.167, len  test loss 0.028, col  test loss 145.662


Epoch 360: 272batch [00:19, 14.21batch/s, loss=757]


epoch 360: avg train loss 781.25, bar train loss 1.832, len train loss 0.022, col train loss 135.898
epoch 360: avg test  loss 835.44, bar  test loss 2.151, len  test loss 0.026, col  test loss 145.646


Epoch 361: 272batch [00:19, 13.93batch/s, loss=846]


epoch 361: avg train loss 781.14, bar train loss 1.830, len train loss 0.022, col train loss 135.850


Epoch 362: 2batch [00:00, 14.18batch/s, loss=754]

epoch 361: avg test  loss 835.77, bar  test loss 2.156, len  test loss 0.025, col  test loss 145.587


Epoch 362: 272batch [00:19, 14.23batch/s, loss=869]


epoch 362: avg train loss 781.01, bar train loss 1.830, len train loss 0.022, col train loss 135.835


Epoch 363: 2batch [00:00, 14.29batch/s, loss=783]

epoch 362: avg test  loss 835.11, bar  test loss 2.155, len  test loss 0.025, col  test loss 145.579


Epoch 363: 272batch [00:19, 14.19batch/s, loss=816]


epoch 363: avg train loss 780.57, bar train loss 1.826, len train loss 0.021, col train loss 135.757


Epoch 364: 2batch [00:00, 14.29batch/s, loss=763]

epoch 363: avg test  loss 836.18, bar  test loss 2.150, len  test loss 0.029, col  test loss 145.580


Epoch 364: 272batch [00:19, 14.17batch/s, loss=773]


epoch 364: avg train loss 780.53, bar train loss 1.824, len train loss 0.022, col train loss 135.727


Epoch 365: 2batch [00:00, 14.18batch/s, loss=791]

epoch 364: avg test  loss 835.87, bar  test loss 2.144, len  test loss 0.025, col  test loss 145.534


Epoch 365: 272batch [00:19, 14.21batch/s, loss=832]


epoch 365: avg train loss 780.32, bar train loss 1.823, len train loss 0.022, col train loss 135.674
epoch 365: avg test  loss 835.60, bar  test loss 2.148, len  test loss 0.025, col  test loss 145.551


Epoch 366: 272batch [00:19, 13.99batch/s, loss=770]


epoch 366: avg train loss 780.05, bar train loss 1.818, len train loss 0.022, col train loss 135.639


Epoch 367: 2batch [00:00, 14.60batch/s, loss=830]

epoch 366: avg test  loss 835.74, bar  test loss 2.148, len  test loss 0.027, col  test loss 145.503


Epoch 367: 272batch [00:19, 14.21batch/s, loss=761]


epoch 367: avg train loss 779.81, bar train loss 1.818, len train loss 0.022, col train loss 135.577


Epoch 368: 0batch [00:00, ?batch/s, loss=742]

epoch 367: avg test  loss 836.05, bar  test loss 2.148, len  test loss 0.026, col  test loss 145.500


Epoch 368: 272batch [00:19, 14.12batch/s, loss=821]


epoch 368: avg train loss 779.63, bar train loss 1.818, len train loss 0.022, col train loss 135.538


Epoch 369: 2batch [00:00, 14.08batch/s, loss=741]

epoch 368: avg test  loss 835.84, bar  test loss 2.147, len  test loss 0.027, col  test loss 145.555


Epoch 369: 272batch [00:19, 14.16batch/s, loss=758]


epoch 369: avg train loss 779.40, bar train loss 1.816, len train loss 0.022, col train loss 135.464


Epoch 370: 2batch [00:00, 13.99batch/s, loss=761]

epoch 369: avg test  loss 835.84, bar  test loss 2.148, len  test loss 0.027, col  test loss 145.446


Epoch 370: 272batch [00:19, 14.15batch/s, loss=787]


epoch 370: avg train loss 779.33, bar train loss 1.815, len train loss 0.021, col train loss 135.471
epoch 370: avg test  loss 834.73, bar  test loss 2.153, len  test loss 0.026, col  test loss 145.451


Epoch 371: 272batch [00:19, 13.92batch/s, loss=748]


epoch 371: avg train loss 779.11, bar train loss 1.813, len train loss 0.022, col train loss 135.408


Epoch 372: 2batch [00:00, 13.99batch/s, loss=801]

epoch 371: avg test  loss 835.54, bar  test loss 2.149, len  test loss 0.025, col  test loss 145.489


Epoch 372: 272batch [00:19, 14.17batch/s, loss=794]


epoch 372: avg train loss 778.77, bar train loss 1.810, len train loss 0.021, col train loss 135.348


Epoch 373: 2batch [00:00, 14.08batch/s, loss=757]

epoch 372: avg test  loss 835.11, bar  test loss 2.144, len  test loss 0.026, col  test loss 145.467


Epoch 373: 272batch [00:19, 14.18batch/s, loss=835]


epoch 373: avg train loss 778.67, bar train loss 1.811, len train loss 0.021, col train loss 135.322


Epoch 374: 2batch [00:00, 14.18batch/s, loss=790]

epoch 373: avg test  loss 835.45, bar  test loss 2.160, len  test loss 0.026, col  test loss 145.481


Epoch 374: 272batch [00:19, 14.12batch/s, loss=837]


epoch 374: avg train loss 778.49, bar train loss 1.806, len train loss 0.022, col train loss 135.272


Epoch 375: 2batch [00:00, 14.08batch/s, loss=755]

epoch 374: avg test  loss 834.95, bar  test loss 2.144, len  test loss 0.025, col  test loss 145.393


Epoch 375: 272batch [00:19, 14.24batch/s, loss=771]


epoch 375: avg train loss 778.32, bar train loss 1.805, len train loss 0.021, col train loss 135.261
epoch 375: avg test  loss 834.74, bar  test loss 2.153, len  test loss 0.026, col  test loss 145.410


Epoch 376: 272batch [00:19, 13.87batch/s, loss=748]


epoch 376: avg train loss 778.18, bar train loss 1.803, len train loss 0.021, col train loss 135.209


Epoch 377: 2batch [00:00, 14.18batch/s, loss=792]

epoch 376: avg test  loss 834.96, bar  test loss 2.144, len  test loss 0.026, col  test loss 145.434


Epoch 377: 272batch [00:19, 14.17batch/s, loss=825]


epoch 377: avg train loss 777.91, bar train loss 1.802, len train loss 0.022, col train loss 135.162


Epoch 378: 2batch [00:00, 14.18batch/s, loss=798]

epoch 377: avg test  loss 834.45, bar  test loss 2.146, len  test loss 0.025, col  test loss 145.345


Epoch 378: 272batch [00:19, 13.81batch/s, loss=808]


epoch 378: avg train loss 777.58, bar train loss 1.798, len train loss 0.022, col train loss 135.095


Epoch 379: 2batch [00:00, 13.79batch/s, loss=786]

epoch 378: avg test  loss 835.26, bar  test loss 2.143, len  test loss 0.025, col  test loss 145.381


Epoch 379: 272batch [00:19, 14.18batch/s, loss=819]


epoch 379: avg train loss 777.31, bar train loss 1.798, len train loss 0.021, col train loss 135.055


Epoch 380: 2batch [00:00, 14.08batch/s, loss=750]

epoch 379: avg test  loss 835.16, bar  test loss 2.147, len  test loss 0.025, col  test loss 145.417


Epoch 380: 272batch [00:19, 14.16batch/s, loss=819]


epoch 380: avg train loss 777.15, bar train loss 1.792, len train loss 0.021, col train loss 135.017
epoch 380: avg test  loss 835.23, bar  test loss 2.137, len  test loss 0.025, col  test loss 145.395


Epoch 381: 272batch [00:19, 13.96batch/s, loss=758]


epoch 381: avg train loss 777.07, bar train loss 1.791, len train loss 0.021, col train loss 135.011


Epoch 382: 1batch [00:00,  7.46batch/s, loss=769]

epoch 381: avg test  loss 835.46, bar  test loss 2.130, len  test loss 0.027, col  test loss 145.347


Epoch 382: 272batch [00:19, 14.01batch/s, loss=827]


epoch 382: avg train loss 776.84, bar train loss 1.792, len train loss 0.021, col train loss 134.962


Epoch 383: 2batch [00:00, 14.08batch/s, loss=784]

epoch 382: avg test  loss 834.73, bar  test loss 2.134, len  test loss 0.026, col  test loss 145.235


Epoch 383: 272batch [00:19, 14.10batch/s, loss=819]


epoch 383: avg train loss 776.67, bar train loss 1.792, len train loss 0.021, col train loss 134.896


Epoch 384: 2batch [00:00, 14.49batch/s, loss=760]

epoch 383: avg test  loss 835.06, bar  test loss 2.132, len  test loss 0.025, col  test loss 145.255


Epoch 384: 272batch [00:19, 14.14batch/s, loss=763]


epoch 384: avg train loss 776.50, bar train loss 1.792, len train loss 0.022, col train loss 134.868


Epoch 385: 2batch [00:00, 12.42batch/s, loss=800]

epoch 384: avg test  loss 835.07, bar  test loss 2.140, len  test loss 0.026, col  test loss 145.272


Epoch 385: 272batch [00:19, 14.15batch/s, loss=733]


epoch 385: avg train loss 776.30, bar train loss 1.786, len train loss 0.022, col train loss 134.842
epoch 385: avg test  loss 834.87, bar  test loss 2.147, len  test loss 0.026, col  test loss 145.333


Epoch 386: 272batch [00:19, 13.88batch/s, loss=763]


epoch 386: avg train loss 776.11, bar train loss 1.784, len train loss 0.021, col train loss 134.783


Epoch 387: 2batch [00:00, 13.99batch/s, loss=783]

epoch 386: avg test  loss 835.42, bar  test loss 2.135, len  test loss 0.026, col  test loss 145.269


Epoch 387: 272batch [00:19, 14.15batch/s, loss=764]


epoch 387: avg train loss 775.89, bar train loss 1.783, len train loss 0.021, col train loss 134.740


Epoch 388: 2batch [00:00, 14.08batch/s, loss=763]

epoch 387: avg test  loss 834.83, bar  test loss 2.138, len  test loss 0.026, col  test loss 145.284


Epoch 388: 272batch [00:19, 14.15batch/s, loss=766]


epoch 388: avg train loss 775.53, bar train loss 1.780, len train loss 0.021, col train loss 134.690


Epoch 389: 2batch [00:00, 13.99batch/s, loss=790]

epoch 388: avg test  loss 834.87, bar  test loss 2.133, len  test loss 0.025, col  test loss 145.258


Epoch 389: 272batch [00:19, 14.15batch/s, loss=825]


epoch 389: avg train loss 775.51, bar train loss 1.780, len train loss 0.021, col train loss 134.656


Epoch 390: 2batch [00:00, 14.18batch/s, loss=796]

epoch 389: avg test  loss 834.42, bar  test loss 2.129, len  test loss 0.026, col  test loss 145.249


Epoch 390: 272batch [00:19, 14.15batch/s, loss=823]


epoch 390: avg train loss 775.19, bar train loss 1.779, len train loss 0.021, col train loss 134.598
epoch 390: avg test  loss 834.71, bar  test loss 2.132, len  test loss 0.025, col  test loss 145.225


Epoch 391: 272batch [00:19, 13.73batch/s, loss=733]


epoch 391: avg train loss 775.11, bar train loss 1.776, len train loss 0.021, col train loss 134.577


Epoch 392: 0batch [00:00, ?batch/s]

epoch 391: avg test  loss 834.15, bar  test loss 2.133, len  test loss 0.025, col  test loss 145.306


Epoch 392: 272batch [00:37,  7.29batch/s, loss=821]


epoch 392: avg train loss 774.83, bar train loss 1.776, len train loss 0.021, col train loss 134.526
epoch 392: avg test  loss 834.92, bar  test loss 2.143, len  test loss 0.029, col  test loss 145.244


Epoch 393: 272batch [00:20, 13.35batch/s, loss=765]


epoch 393: avg train loss 774.79, bar train loss 1.776, len train loss 0.021, col train loss 134.498


Epoch 394: 2batch [00:00, 13.79batch/s, loss=792]

epoch 393: avg test  loss 834.79, bar  test loss 2.123, len  test loss 0.025, col  test loss 145.157


Epoch 394: 272batch [00:19, 14.04batch/s, loss=777]


epoch 394: avg train loss 774.44, bar train loss 1.772, len train loss 0.021, col train loss 134.428


Epoch 395: 2batch [00:00, 13.70batch/s, loss=779]

epoch 394: avg test  loss 834.69, bar  test loss 2.113, len  test loss 0.025, col  test loss 145.087


Epoch 395: 272batch [00:19, 14.04batch/s, loss=791]


epoch 395: avg train loss 774.43, bar train loss 1.775, len train loss 0.021, col train loss 134.423
epoch 395: avg test  loss 834.63, bar  test loss 2.121, len  test loss 0.026, col  test loss 145.135


Epoch 396: 272batch [00:20, 13.44batch/s, loss=755]


epoch 396: avg train loss 774.04, bar train loss 1.768, len train loss 0.021, col train loss 134.359


Epoch 397: 2batch [00:00, 13.42batch/s, loss=747]

epoch 396: avg test  loss 834.68, bar  test loss 2.106, len  test loss 0.026, col  test loss 145.139


Epoch 397: 272batch [00:21, 12.66batch/s, loss=737]


epoch 397: avg train loss 773.91, bar train loss 1.769, len train loss 0.021, col train loss 134.322


Epoch 398: 1batch [00:00,  9.52batch/s, loss=745]

epoch 397: avg test  loss 834.64, bar  test loss 2.137, len  test loss 0.027, col  test loss 145.160


Epoch 398: 272batch [00:22, 12.30batch/s, loss=728]


epoch 398: avg train loss 773.75, bar train loss 1.768, len train loss 0.021, col train loss 134.290


Epoch 399: 2batch [00:00, 12.66batch/s, loss=806]

epoch 398: avg test  loss 834.70, bar  test loss 2.115, len  test loss 0.025, col  test loss 145.107


Epoch 399: 272batch [00:22, 12.29batch/s, loss=800]


epoch 399: avg train loss 773.61, bar train loss 1.766, len train loss 0.021, col train loss 134.259


Epoch 400: 0batch [00:00, ?batch/s, loss=753]

epoch 399: avg test  loss 834.74, bar  test loss 2.128, len  test loss 0.025, col  test loss 145.086


Epoch 400: 272batch [00:21, 12.60batch/s, loss=732]


epoch 400: avg train loss 773.41, bar train loss 1.763, len train loss 0.021, col train loss 134.220
epoch 400: avg test  loss 834.60, bar  test loss 2.122, len  test loss 0.026, col  test loss 145.130


Epoch 401: 272batch [00:20, 13.08batch/s, loss=786]


epoch 401: avg train loss 773.27, bar train loss 1.762, len train loss 0.021, col train loss 134.171


Epoch 402: 0batch [00:00, ?batch/s, loss=758]

epoch 401: avg test  loss 834.64, bar  test loss 2.136, len  test loss 0.027, col  test loss 145.038


Epoch 402: 272batch [00:19, 14.00batch/s, loss=742]


epoch 402: avg train loss 772.95, bar train loss 1.761, len train loss 0.021, col train loss 134.111


Epoch 403: 1batch [00:00,  9.90batch/s, loss=794]

epoch 402: avg test  loss 834.08, bar  test loss 2.121, len  test loss 0.026, col  test loss 145.033


Epoch 403: 272batch [00:19, 13.85batch/s, loss=728]


epoch 403: avg train loss 772.75, bar train loss 1.758, len train loss 0.020, col train loss 134.088


Epoch 404: 2batch [00:00, 12.20batch/s, loss=764]

epoch 403: avg test  loss 834.02, bar  test loss 2.117, len  test loss 0.026, col  test loss 145.073


Epoch 404: 272batch [00:22, 12.29batch/s, loss=782]


epoch 404: avg train loss 772.55, bar train loss 1.759, len train loss 0.021, col train loss 134.043


Epoch 405: 2batch [00:00, 12.90batch/s, loss=776]

epoch 404: avg test  loss 834.52, bar  test loss 2.129, len  test loss 0.025, col  test loss 144.996


Epoch 405: 272batch [00:21, 12.84batch/s, loss=780]


epoch 405: avg train loss 772.36, bar train loss 1.755, len train loss 0.021, col train loss 134.002
epoch 405: avg test  loss 834.18, bar  test loss 2.118, len  test loss 0.029, col  test loss 145.048


Epoch 406: 272batch [00:22, 12.00batch/s, loss=794]


epoch 406: avg train loss 772.39, bar train loss 1.757, len train loss 0.022, col train loss 133.973


Epoch 407: 0batch [00:00, ?batch/s, loss=765]

epoch 406: avg test  loss 834.22, bar  test loss 2.121, len  test loss 0.028, col  test loss 145.087


Epoch 407: 272batch [00:21, 12.71batch/s, loss=738]


epoch 407: avg train loss 771.87, bar train loss 1.754, len train loss 0.021, col train loss 133.889


Epoch 408: 2batch [00:00, 12.82batch/s, loss=788]

epoch 407: avg test  loss 834.01, bar  test loss 2.114, len  test loss 0.026, col  test loss 145.028


Epoch 408: 272batch [00:21, 12.74batch/s, loss=721]


epoch 408: avg train loss 771.80, bar train loss 1.749, len train loss 0.020, col train loss 133.874


Epoch 409: 2batch [00:00, 12.74batch/s, loss=769]

epoch 408: avg test  loss 834.03, bar  test loss 2.123, len  test loss 0.025, col  test loss 145.045


Epoch 409: 272batch [00:21, 12.42batch/s, loss=718]


epoch 409: avg train loss 771.77, bar train loss 1.751, len train loss 0.021, col train loss 133.843


Epoch 410: 2batch [00:00, 12.82batch/s, loss=789]

epoch 409: avg test  loss 834.08, bar  test loss 2.111, len  test loss 0.026, col  test loss 145.036


Epoch 410: 272batch [00:21, 12.84batch/s, loss=818]


epoch 410: avg train loss 771.59, bar train loss 1.748, len train loss 0.021, col train loss 133.826
epoch 410: avg test  loss 834.37, bar  test loss 2.107, len  test loss 0.026, col  test loss 145.027


Epoch 411: 272batch [00:22, 12.11batch/s, loss=777]


epoch 411: avg train loss 771.39, bar train loss 1.746, len train loss 0.021, col train loss 133.780


Epoch 412: 1batch [00:00, 10.00batch/s, loss=755]

epoch 411: avg test  loss 834.11, bar  test loss 2.113, len  test loss 0.026, col  test loss 144.921


Epoch 412: 272batch [00:22, 12.29batch/s, loss=737]


epoch 412: avg train loss 771.20, bar train loss 1.746, len train loss 0.021, col train loss 133.739


Epoch 413: 2batch [00:00, 13.33batch/s, loss=760]

epoch 412: avg test  loss 834.15, bar  test loss 2.112, len  test loss 0.026, col  test loss 145.053


Epoch 413: 272batch [00:21, 12.85batch/s, loss=853]


epoch 413: avg train loss 771.08, bar train loss 1.742, len train loss 0.021, col train loss 133.713


Epoch 414: 2batch [00:00, 13.16batch/s, loss=753]

epoch 413: avg test  loss 833.99, bar  test loss 2.130, len  test loss 0.029, col  test loss 144.974


Epoch 414: 272batch [00:21, 12.78batch/s, loss=850]


epoch 414: avg train loss 770.85, bar train loss 1.742, len train loss 0.021, col train loss 133.661


Epoch 415: 2batch [00:00, 13.33batch/s, loss=762]

epoch 414: avg test  loss 834.15, bar  test loss 2.122, len  test loss 0.026, col  test loss 144.958


Epoch 415: 272batch [00:21, 12.85batch/s, loss=779]


epoch 415: avg train loss 770.53, bar train loss 1.740, len train loss 0.021, col train loss 133.598
epoch 415: avg test  loss 834.09, bar  test loss 2.104, len  test loss 0.026, col  test loss 144.993


Epoch 416: 272batch [00:21, 12.57batch/s, loss=802]


epoch 416: avg train loss 770.48, bar train loss 1.739, len train loss 0.021, col train loss 133.572


Epoch 417: 2batch [00:00, 13.02batch/s, loss=763]

epoch 416: avg test  loss 834.08, bar  test loss 2.115, len  test loss 0.027, col  test loss 144.966


Epoch 417: 272batch [00:21, 12.85batch/s, loss=779]


epoch 417: avg train loss 770.09, bar train loss 1.741, len train loss 0.021, col train loss 133.496


Epoch 418: 1batch [00:00,  8.77batch/s, loss=785]

epoch 417: avg test  loss 834.12, bar  test loss 2.109, len  test loss 0.027, col  test loss 144.942


Epoch 418: 272batch [00:21, 12.59batch/s, loss=739]


epoch 418: avg train loss 770.24, bar train loss 1.738, len train loss 0.021, col train loss 133.512


Epoch 419: 2batch [00:00, 12.58batch/s, loss=773]

epoch 418: avg test  loss 834.02, bar  test loss 2.098, len  test loss 0.025, col  test loss 144.906


Epoch 419: 272batch [00:22, 12.30batch/s, loss=793]


epoch 419: avg train loss 769.91, bar train loss 1.737, len train loss 0.021, col train loss 133.457


Epoch 420: 2batch [00:00, 13.25batch/s, loss=772]

epoch 419: avg test  loss 834.37, bar  test loss 2.106, len  test loss 0.025, col  test loss 144.860


Epoch 420: 272batch [00:20, 13.41batch/s, loss=759]


epoch 420: avg train loss 769.81, bar train loss 1.733, len train loss 0.021, col train loss 133.432
epoch 420: avg test  loss 834.03, bar  test loss 2.113, len  test loss 0.027, col  test loss 144.888


Epoch 421: 272batch [00:20, 13.40batch/s, loss=723]


epoch 421: avg train loss 769.64, bar train loss 1.730, len train loss 0.021, col train loss 133.405


Epoch 422: 2batch [00:00, 13.99batch/s, loss=756]

epoch 421: avg test  loss 833.93, bar  test loss 2.110, len  test loss 0.027, col  test loss 144.863


Epoch 422: 272batch [00:19, 13.95batch/s, loss=754]


epoch 422: avg train loss 769.34, bar train loss 1.729, len train loss 0.020, col train loss 133.349


Epoch 423: 2batch [00:00, 13.89batch/s, loss=783]

epoch 422: avg test  loss 834.20, bar  test loss 2.113, len  test loss 0.025, col  test loss 144.900


Epoch 423: 272batch [00:19, 13.93batch/s, loss=773]


epoch 423: avg train loss 769.20, bar train loss 1.731, len train loss 0.021, col train loss 133.302


Epoch 424: 2batch [00:00, 14.08batch/s, loss=775]

epoch 423: avg test  loss 834.13, bar  test loss 2.099, len  test loss 0.026, col  test loss 144.879


Epoch 424: 272batch [00:19, 13.94batch/s, loss=813]


epoch 424: avg train loss 768.89, bar train loss 1.725, len train loss 0.021, col train loss 133.252


Epoch 425: 2batch [00:00, 13.33batch/s, loss=777]

epoch 424: avg test  loss 834.09, bar  test loss 2.106, len  test loss 0.025, col  test loss 144.877


Epoch 425: 272batch [00:19, 13.89batch/s, loss=824]


epoch 425: avg train loss 768.82, bar train loss 1.726, len train loss 0.020, col train loss 133.232
epoch 425: avg test  loss 834.34, bar  test loss 2.115, len  test loss 0.030, col  test loss 144.817


Epoch 426: 272batch [00:20, 13.38batch/s, loss=816]


epoch 426: avg train loss 768.67, bar train loss 1.729, len train loss 0.021, col train loss 133.175


Epoch 427: 2batch [00:00, 13.89batch/s, loss=767]

epoch 426: avg test  loss 834.10, bar  test loss 2.099, len  test loss 0.025, col  test loss 144.770


Epoch 427: 272batch [00:19, 13.98batch/s, loss=809]


epoch 427: avg train loss 768.51, bar train loss 1.724, len train loss 0.020, col train loss 133.175


Epoch 428: 2batch [00:00, 13.79batch/s, loss=756]

epoch 427: avg test  loss 833.91, bar  test loss 2.103, len  test loss 0.026, col  test loss 144.782


Epoch 428: 272batch [00:19, 13.87batch/s, loss=766]


epoch 428: avg train loss 768.29, bar train loss 1.723, len train loss 0.020, col train loss 133.112


Epoch 429: 2batch [00:00, 13.51batch/s, loss=789]

epoch 428: avg test  loss 833.76, bar  test loss 2.102, len  test loss 0.026, col  test loss 144.845


Epoch 429: 272batch [00:19, 13.96batch/s, loss=786]


epoch 429: avg train loss 768.11, bar train loss 1.719, len train loss 0.020, col train loss 133.082


Epoch 430: 2batch [00:00, 13.42batch/s, loss=773]

epoch 429: avg test  loss 833.57, bar  test loss 2.110, len  test loss 0.026, col  test loss 144.810


Epoch 430: 272batch [00:19, 13.84batch/s, loss=818]


epoch 430: avg train loss 768.10, bar train loss 1.722, len train loss 0.021, col train loss 133.064
epoch 430: avg test  loss 833.55, bar  test loss 2.099, len  test loss 0.026, col  test loss 144.797


Epoch 431: 272batch [00:20, 13.36batch/s, loss=730]


epoch 431: avg train loss 767.81, bar train loss 1.717, len train loss 0.021, col train loss 133.012


Epoch 432: 2batch [00:00, 13.99batch/s, loss=778]

epoch 431: avg test  loss 834.32, bar  test loss 2.095, len  test loss 0.029, col  test loss 144.748


Epoch 432: 272batch [00:19, 14.06batch/s, loss=761]


epoch 432: avg train loss 767.45, bar train loss 1.715, len train loss 0.021, col train loss 132.942


Epoch 433: 1batch [00:00,  8.40batch/s, loss=761]

epoch 432: avg test  loss 833.97, bar  test loss 2.097, len  test loss 0.026, col  test loss 144.850


Epoch 433: 272batch [00:19, 13.96batch/s, loss=831]


epoch 433: avg train loss 767.41, bar train loss 1.717, len train loss 0.020, col train loss 132.930


Epoch 434: 2batch [00:00, 13.89batch/s, loss=781]

epoch 433: avg test  loss 834.10, bar  test loss 2.087, len  test loss 0.027, col  test loss 144.693


Epoch 434: 272batch [00:19, 14.01batch/s, loss=779]


epoch 434: avg train loss 767.22, bar train loss 1.714, len train loss 0.020, col train loss 132.883


Epoch 435: 2batch [00:00, 14.08batch/s, loss=755]

epoch 434: avg test  loss 833.78, bar  test loss 2.115, len  test loss 0.026, col  test loss 144.832


Epoch 435: 272batch [00:19, 14.04batch/s, loss=789]


epoch 435: avg train loss 767.17, bar train loss 1.715, len train loss 0.021, col train loss 132.866
epoch 435: avg test  loss 834.08, bar  test loss 2.109, len  test loss 0.029, col  test loss 144.754


Epoch 436: 272batch [00:19, 13.70batch/s, loss=780]


epoch 436: avg train loss 766.84, bar train loss 1.713, len train loss 0.021, col train loss 132.806


Epoch 437: 2batch [00:00, 14.08batch/s, loss=770]

epoch 436: avg test  loss 833.83, bar  test loss 2.100, len  test loss 0.026, col  test loss 144.768


Epoch 437: 272batch [00:19, 14.08batch/s, loss=755]


epoch 437: avg train loss 766.71, bar train loss 1.708, len train loss 0.020, col train loss 132.774


Epoch 438: 2batch [00:00, 13.89batch/s, loss=782]

epoch 437: avg test  loss 833.18, bar  test loss 2.107, len  test loss 0.026, col  test loss 144.693


Epoch 438: 272batch [00:19, 14.02batch/s, loss=738]


epoch 438: avg train loss 766.45, bar train loss 1.710, len train loss 0.021, col train loss 132.714


Epoch 439: 2batch [00:00, 12.99batch/s, loss=754]

epoch 438: avg test  loss 833.34, bar  test loss 2.106, len  test loss 0.026, col  test loss 144.719


Epoch 439: 272batch [00:19, 13.99batch/s, loss=817]


epoch 439: avg train loss 766.30, bar train loss 1.707, len train loss 0.020, col train loss 132.684


Epoch 440: 2batch [00:00, 13.42batch/s, loss=779]

epoch 439: avg test  loss 834.10, bar  test loss 2.088, len  test loss 0.029, col  test loss 144.633


Epoch 440: 272batch [00:19, 14.01batch/s, loss=750]


epoch 440: avg train loss 766.28, bar train loss 1.708, len train loss 0.020, col train loss 132.677
epoch 440: avg test  loss 833.41, bar  test loss 2.099, len  test loss 0.030, col  test loss 144.767


Epoch 441: 272batch [00:20, 13.55batch/s, loss=746]


epoch 441: avg train loss 766.05, bar train loss 1.707, len train loss 0.021, col train loss 132.633


Epoch 442: 2batch [00:00, 13.51batch/s, loss=809]

epoch 441: avg test  loss 833.58, bar  test loss 2.086, len  test loss 0.025, col  test loss 144.711


Epoch 442: 272batch [00:19, 13.98batch/s, loss=761]


epoch 442: avg train loss 765.99, bar train loss 1.705, len train loss 0.020, col train loss 132.614


Epoch 443: 2batch [00:00, 13.89batch/s, loss=716]

epoch 442: avg test  loss 834.08, bar  test loss 2.091, len  test loss 0.028, col  test loss 144.685


Epoch 443: 272batch [00:19, 13.96batch/s, loss=782]


epoch 443: avg train loss 765.82, bar train loss 1.702, len train loss 0.020, col train loss 132.584


Epoch 444: 2batch [00:00, 13.89batch/s, loss=799]

epoch 443: avg test  loss 833.86, bar  test loss 2.097, len  test loss 0.026, col  test loss 144.708


Epoch 444: 272batch [00:19, 13.98batch/s, loss=791]


epoch 444: avg train loss 765.47, bar train loss 1.700, len train loss 0.020, col train loss 132.512


Epoch 445: 2batch [00:00, 13.79batch/s, loss=787]

epoch 444: avg test  loss 833.08, bar  test loss 2.101, len  test loss 0.026, col  test loss 144.710


Epoch 445: 272batch [00:19, 13.99batch/s, loss=773]


epoch 445: avg train loss 765.42, bar train loss 1.700, len train loss 0.020, col train loss 132.502
epoch 445: avg test  loss 833.33, bar  test loss 2.116, len  test loss 0.026, col  test loss 144.755


Epoch 446: 272batch [00:20, 13.31batch/s, loss=763]


epoch 446: avg train loss 765.17, bar train loss 1.699, len train loss 0.020, col train loss 132.456


Epoch 447: 2batch [00:00, 13.33batch/s, loss=772]

epoch 446: avg test  loss 833.77, bar  test loss 2.093, len  test loss 0.025, col  test loss 144.598


Epoch 447: 272batch [00:19, 14.00batch/s, loss=849]


epoch 447: avg train loss 765.02, bar train loss 1.698, len train loss 0.020, col train loss 132.431


Epoch 448: 2batch [00:00, 14.49batch/s, loss=746]

epoch 447: avg test  loss 833.88, bar  test loss 2.102, len  test loss 0.030, col  test loss 144.704


Epoch 448: 272batch [00:20, 13.58batch/s, loss=749]


epoch 448: avg train loss 764.89, bar train loss 1.695, len train loss 0.020, col train loss 132.397


Epoch 449: 2batch [00:00, 12.90batch/s, loss=754]

epoch 448: avg test  loss 833.74, bar  test loss 2.095, len  test loss 0.026, col  test loss 144.717


Epoch 449: 272batch [00:20, 12.98batch/s, loss=766]


epoch 449: avg train loss 764.67, bar train loss 1.693, len train loss 0.020, col train loss 132.348


Epoch 450: 2batch [00:00, 12.99batch/s, loss=759]

epoch 449: avg test  loss 833.32, bar  test loss 2.088, len  test loss 0.026, col  test loss 144.688


Epoch 450: 272batch [00:23, 11.82batch/s, loss=808]


epoch 450: avg train loss 764.58, bar train loss 1.695, len train loss 0.020, col train loss 132.319
epoch 450: avg test  loss 833.80, bar  test loss 2.091, len  test loss 0.030, col  test loss 144.652


Epoch 451: 272batch [00:22, 12.01batch/s, loss=802]


epoch 451: avg train loss 764.46, bar train loss 1.694, len train loss 0.020, col train loss 132.280


Epoch 452: 0batch [00:00, ?batch/s]

epoch 451: avg test  loss 833.73, bar  test loss 2.091, len  test loss 0.026, col  test loss 144.609


Epoch 452: 272batch [00:21, 12.52batch/s, loss=749]


epoch 452: avg train loss 764.25, bar train loss 1.693, len train loss 0.020, col train loss 132.240


Epoch 453: 2batch [00:00, 13.25batch/s, loss=762]

epoch 452: avg test  loss 833.61, bar  test loss 2.098, len  test loss 0.027, col  test loss 144.594


Epoch 453: 272batch [00:21, 12.76batch/s, loss=785]


epoch 453: avg train loss 764.03, bar train loss 1.692, len train loss 0.020, col train loss 132.203


Epoch 454: 2batch [00:00, 12.90batch/s, loss=761]

epoch 453: avg test  loss 833.64, bar  test loss 2.089, len  test loss 0.027, col  test loss 144.588


Epoch 454: 272batch [00:21, 12.64batch/s, loss=747]


epoch 454: avg train loss 763.85, bar train loss 1.688, len train loss 0.020, col train loss 132.163


Epoch 455: 2batch [00:00, 12.99batch/s, loss=795]

epoch 454: avg test  loss 833.45, bar  test loss 2.093, len  test loss 0.026, col  test loss 144.599


Epoch 455: 272batch [00:21, 12.64batch/s, loss=793]


epoch 455: avg train loss 763.64, bar train loss 1.687, len train loss 0.020, col train loss 132.128
epoch 455: avg test  loss 833.94, bar  test loss 2.085, len  test loss 0.026, col  test loss 144.576


Epoch 456: 272batch [00:24, 11.12batch/s, loss=685]


epoch 456: avg train loss 763.54, bar train loss 1.686, len train loss 0.020, col train loss 132.100


Epoch 457: 0batch [00:00, ?batch/s, loss=752]

epoch 456: avg test  loss 833.75, bar  test loss 2.082, len  test loss 0.026, col  test loss 144.608


Epoch 457: 272batch [00:22, 12.08batch/s, loss=752]


epoch 457: avg train loss 763.44, bar train loss 1.685, len train loss 0.020, col train loss 132.080


Epoch 458: 2batch [00:00, 13.24batch/s, loss=744]

epoch 457: avg test  loss 833.30, bar  test loss 2.093, len  test loss 0.026, col  test loss 144.519


Epoch 458: 272batch [00:21, 12.70batch/s, loss=740]


epoch 458: avg train loss 763.46, bar train loss 1.687, len train loss 0.020, col train loss 132.067


Epoch 459: 2batch [00:00, 12.86batch/s, loss=787]

epoch 458: avg test  loss 833.53, bar  test loss 2.088, len  test loss 0.026, col  test loss 144.566


Epoch 459: 272batch [00:21, 12.72batch/s, loss=742]


epoch 459: avg train loss 763.24, bar train loss 1.684, len train loss 0.020, col train loss 132.037


Epoch 460: 2batch [00:00, 12.58batch/s, loss=774]

epoch 459: avg test  loss 833.63, bar  test loss 2.080, len  test loss 0.027, col  test loss 144.674


Epoch 460: 272batch [00:21, 12.63batch/s, loss=785]


epoch 460: avg train loss 762.99, bar train loss 1.683, len train loss 0.020, col train loss 131.982
epoch 460: avg test  loss 834.03, bar  test loss 2.082, len  test loss 0.025, col  test loss 144.554


Epoch 461: 272batch [00:22, 12.22batch/s, loss=780]


epoch 461: avg train loss 762.74, bar train loss 1.681, len train loss 0.020, col train loss 131.923


Epoch 462: 2batch [00:00, 12.50batch/s, loss=758]

epoch 461: avg test  loss 833.80, bar  test loss 2.101, len  test loss 0.026, col  test loss 144.609


Epoch 462: 272batch [00:21, 12.70batch/s, loss=797]


epoch 462: avg train loss 762.51, bar train loss 1.680, len train loss 0.020, col train loss 131.892


Epoch 463: 0batch [00:00, ?batch/s, loss=757]

epoch 462: avg test  loss 834.03, bar  test loss 2.090, len  test loss 0.026, col  test loss 144.501


Epoch 463: 272batch [00:21, 12.68batch/s, loss=712]


epoch 463: avg train loss 762.40, bar train loss 1.676, len train loss 0.020, col train loss 131.862


Epoch 464: 2batch [00:00, 12.99batch/s, loss=756]

epoch 463: avg test  loss 833.23, bar  test loss 2.094, len  test loss 0.025, col  test loss 144.515


Epoch 464: 272batch [00:21, 12.40batch/s, loss=741]


epoch 464: avg train loss 762.18, bar train loss 1.678, len train loss 0.020, col train loss 131.797


Epoch 465: 2batch [00:00, 13.07batch/s, loss=763]

epoch 464: avg test  loss 833.48, bar  test loss 2.075, len  test loss 0.025, col  test loss 144.485


Epoch 465: 272batch [00:21, 12.54batch/s, loss=696]


epoch 465: avg train loss 762.00, bar train loss 1.677, len train loss 0.020, col train loss 131.768
epoch 465: avg test  loss 833.94, bar  test loss 2.094, len  test loss 0.029, col  test loss 144.600


Epoch 466: 272batch [00:22, 12.19batch/s, loss=743]


epoch 466: avg train loss 761.90, bar train loss 1.672, len train loss 0.020, col train loss 131.765


Epoch 467: 2batch [00:00, 13.16batch/s, loss=734]

epoch 466: avg test  loss 833.84, bar  test loss 2.076, len  test loss 0.026, col  test loss 144.446


Epoch 467: 272batch [00:22, 12.14batch/s, loss=822]


epoch 467: avg train loss 761.68, bar train loss 1.675, len train loss 0.020, col train loss 131.709


Epoch 468: 2batch [00:00, 12.66batch/s, loss=761]

epoch 467: avg test  loss 833.45, bar  test loss 2.084, len  test loss 0.026, col  test loss 144.523


Epoch 468: 272batch [00:21, 12.53batch/s, loss=766]


epoch 468: avg train loss 761.58, bar train loss 1.673, len train loss 0.020, col train loss 131.693


Epoch 469: 2batch [00:00, 12.82batch/s, loss=735]

epoch 468: avg test  loss 833.82, bar  test loss 2.093, len  test loss 0.026, col  test loss 144.518


Epoch 469: 272batch [00:21, 12.65batch/s, loss=739]


epoch 469: avg train loss 761.49, bar train loss 1.671, len train loss 0.020, col train loss 131.657


Epoch 470: 2batch [00:00, 12.74batch/s, loss=773]

epoch 469: avg test  loss 833.44, bar  test loss 2.090, len  test loss 0.026, col  test loss 144.449


Epoch 470: 272batch [00:21, 12.70batch/s, loss=781]


epoch 470: avg train loss 761.42, bar train loss 1.669, len train loss 0.020, col train loss 131.645
epoch 470: avg test  loss 834.08, bar  test loss 2.098, len  test loss 0.031, col  test loss 144.560


Epoch 471: 272batch [00:22, 11.93batch/s, loss=783]


epoch 471: avg train loss 761.08, bar train loss 1.667, len train loss 0.020, col train loss 131.580


Epoch 472: 2batch [00:00, 12.99batch/s, loss=716]

epoch 471: avg test  loss 833.01, bar  test loss 2.088, len  test loss 0.026, col  test loss 144.482


Epoch 472: 272batch [00:21, 12.43batch/s, loss=780]


epoch 472: avg train loss 760.88, bar train loss 1.668, len train loss 0.020, col train loss 131.535


Epoch 473: 2batch [00:00, 12.58batch/s, loss=767]

epoch 472: avg test  loss 833.47, bar  test loss 2.075, len  test loss 0.026, col  test loss 144.446


Epoch 473: 272batch [00:20, 13.39batch/s, loss=759]


epoch 473: avg train loss 760.88, bar train loss 1.666, len train loss 0.020, col train loss 131.526


Epoch 474: 2batch [00:00, 12.35batch/s, loss=784]

epoch 473: avg test  loss 833.52, bar  test loss 2.081, len  test loss 0.027, col  test loss 144.482


Epoch 474: 272batch [00:21, 12.49batch/s, loss=743]


epoch 474: avg train loss 760.79, bar train loss 1.664, len train loss 0.020, col train loss 131.518


Epoch 475: 2batch [00:00, 12.20batch/s, loss=756]

epoch 474: avg test  loss 833.24, bar  test loss 2.075, len  test loss 0.026, col  test loss 144.472


Epoch 475: 272batch [00:21, 12.61batch/s, loss=686]


epoch 475: avg train loss 760.44, bar train loss 1.664, len train loss 0.020, col train loss 131.446
epoch 475: avg test  loss 833.65, bar  test loss 2.084, len  test loss 0.026, col  test loss 144.451


Epoch 476: 272batch [00:22, 12.11batch/s, loss=738]


epoch 476: avg train loss 760.41, bar train loss 1.664, len train loss 0.020, col train loss 131.422


Epoch 477: 2batch [00:00, 12.12batch/s, loss=783]

epoch 476: avg test  loss 833.84, bar  test loss 2.083, len  test loss 0.026, col  test loss 144.524


Epoch 477: 272batch [00:22, 12.04batch/s, loss=697]


epoch 477: avg train loss 760.17, bar train loss 1.662, len train loss 0.020, col train loss 131.385


Epoch 478: 2batch [00:00, 12.20batch/s, loss=753]

epoch 477: avg test  loss 833.69, bar  test loss 2.077, len  test loss 0.027, col  test loss 144.492


Epoch 478: 272batch [00:21, 12.50batch/s, loss=712]


epoch 478: avg train loss 760.19, bar train loss 1.662, len train loss 0.020, col train loss 131.388


Epoch 479: 0batch [00:00, ?batch/s, loss=743]

epoch 478: avg test  loss 833.69, bar  test loss 2.104, len  test loss 0.028, col  test loss 144.503


Epoch 479: 272batch [00:22, 12.12batch/s, loss=756]


epoch 479: avg train loss 759.91, bar train loss 1.661, len train loss 0.020, col train loss 131.323


Epoch 480: 2batch [00:00, 12.66batch/s, loss=781]

epoch 479: avg test  loss 833.80, bar  test loss 2.079, len  test loss 0.026, col  test loss 144.527


Epoch 480: 272batch [00:21, 12.61batch/s, loss=770]


epoch 480: avg train loss 759.73, bar train loss 1.658, len train loss 0.020, col train loss 131.311
epoch 480: avg test  loss 833.58, bar  test loss 2.099, len  test loss 0.027, col  test loss 144.449


Epoch 481: 272batch [00:21, 12.78batch/s, loss=747]


epoch 481: avg train loss 759.60, bar train loss 1.657, len train loss 0.020, col train loss 131.264


Epoch 482: 2batch [00:00, 13.07batch/s, loss=764]

epoch 481: avg test  loss 833.54, bar  test loss 2.080, len  test loss 0.028, col  test loss 144.478


Epoch 482: 272batch [00:20, 13.50batch/s, loss=725]


epoch 482: avg train loss 759.42, bar train loss 1.656, len train loss 0.020, col train loss 131.236


Epoch 483: 2batch [00:00, 13.42batch/s, loss=794]

epoch 482: avg test  loss 833.69, bar  test loss 2.076, len  test loss 0.026, col  test loss 144.356


Epoch 483: 272batch [00:20, 13.55batch/s, loss=777]


epoch 483: avg train loss 759.42, bar train loss 1.657, len train loss 0.019, col train loss 131.208


Epoch 484: 2batch [00:00, 12.90batch/s, loss=765]

epoch 483: avg test  loss 833.93, bar  test loss 2.115, len  test loss 0.032, col  test loss 144.438


Epoch 484: 272batch [00:19, 13.93batch/s, loss=704]


epoch 484: avg train loss 759.11, bar train loss 1.654, len train loss 0.020, col train loss 131.174


Epoch 485: 2batch [00:00, 13.16batch/s, loss=734]

epoch 484: avg test  loss 833.34, bar  test loss 2.087, len  test loss 0.026, col  test loss 144.524


Epoch 485: 272batch [00:19, 13.90batch/s, loss=736]


epoch 485: avg train loss 758.92, bar train loss 1.656, len train loss 0.020, col train loss 131.143
epoch 485: avg test  loss 833.61, bar  test loss 2.085, len  test loss 0.027, col  test loss 144.496


Epoch 486: 272batch [00:22, 12.01batch/s, loss=823]


epoch 486: avg train loss 758.99, bar train loss 1.655, len train loss 0.020, col train loss 131.126


Epoch 487: 2batch [00:00, 12.42batch/s, loss=726]

epoch 486: avg test  loss 833.03, bar  test loss 2.093, len  test loss 0.028, col  test loss 144.443


Epoch 487: 272batch [00:21, 12.62batch/s, loss=767]


epoch 487: avg train loss 758.69, bar train loss 1.650, len train loss 0.020, col train loss 131.084


Epoch 488: 2batch [00:00, 12.82batch/s, loss=759]

epoch 487: avg test  loss 833.22, bar  test loss 2.073, len  test loss 0.026, col  test loss 144.422


Epoch 488: 272batch [00:21, 12.52batch/s, loss=787]


epoch 488: avg train loss 758.58, bar train loss 1.651, len train loss 0.020, col train loss 131.045


Epoch 489: 2batch [00:00, 12.90batch/s, loss=777]

epoch 488: avg test  loss 833.55, bar  test loss 2.082, len  test loss 0.029, col  test loss 144.371


Epoch 489: 272batch [00:21, 12.51batch/s, loss=784]


epoch 489: avg train loss 758.39, bar train loss 1.648, len train loss 0.020, col train loss 131.026


Epoch 490: 2batch [00:00, 12.35batch/s, loss=791]

epoch 489: avg test  loss 833.80, bar  test loss 2.084, len  test loss 0.028, col  test loss 144.350


Epoch 490: 272batch [00:21, 12.37batch/s, loss=766]


epoch 490: avg train loss 758.45, bar train loss 1.651, len train loss 0.020, col train loss 131.003
epoch 490: avg test  loss 833.85, bar  test loss 2.076, len  test loss 0.025, col  test loss 144.362


Epoch 491: 272batch [00:23, 11.75batch/s, loss=751]


epoch 491: avg train loss 758.26, bar train loss 1.650, len train loss 0.019, col train loss 130.965


Epoch 492: 2batch [00:00, 12.50batch/s, loss=750]

epoch 491: avg test  loss 833.53, bar  test loss 2.077, len  test loss 0.027, col  test loss 144.399


Epoch 492: 272batch [00:22, 12.08batch/s, loss=779]


epoch 492: avg train loss 758.05, bar train loss 1.647, len train loss 0.020, col train loss 130.927


Epoch 493: 2batch [00:00, 11.56batch/s, loss=752]

epoch 492: avg test  loss 833.62, bar  test loss 2.072, len  test loss 0.027, col  test loss 144.403


Epoch 493: 272batch [00:22, 12.27batch/s, loss=823]


epoch 493: avg train loss 757.87, bar train loss 1.647, len train loss 0.020, col train loss 130.910


Epoch 494: 0batch [00:00, ?batch/s]

epoch 493: avg test  loss 834.27, bar  test loss 2.079, len  test loss 0.026, col  test loss 144.338


Epoch 494: 272batch [00:24, 11.03batch/s, loss=773]


epoch 494: avg train loss 757.75, bar train loss 1.643, len train loss 0.020, col train loss 130.864


Epoch 495: 2batch [00:00, 12.12batch/s, loss=760]

epoch 494: avg test  loss 833.55, bar  test loss 2.081, len  test loss 0.027, col  test loss 144.417


Epoch 495: 272batch [00:22, 11.87batch/s, loss=700]


epoch 495: avg train loss 757.55, bar train loss 1.643, len train loss 0.019, col train loss 130.845
epoch 495: avg test  loss 833.40, bar  test loss 2.074, len  test loss 0.026, col  test loss 144.417


Epoch 496: 272batch [00:23, 11.78batch/s, loss=827]


epoch 496: avg train loss 757.58, bar train loss 1.643, len train loss 0.020, col train loss 130.827


Epoch 497: 2batch [00:00, 12.20batch/s, loss=779]

epoch 496: avg test  loss 833.58, bar  test loss 2.078, len  test loss 0.026, col  test loss 144.320


Epoch 497: 272batch [00:22, 12.26batch/s, loss=766]


epoch 497: avg train loss 757.43, bar train loss 1.643, len train loss 0.020, col train loss 130.794


Epoch 498: 2batch [00:00, 12.50batch/s, loss=742]

epoch 497: avg test  loss 833.79, bar  test loss 2.072, len  test loss 0.028, col  test loss 144.453


Epoch 498: 272batch [00:22, 12.00batch/s, loss=863]


epoch 498: avg train loss 757.15, bar train loss 1.644, len train loss 0.020, col train loss 130.729


Epoch 499: 2batch [00:00, 12.20batch/s, loss=750]

epoch 498: avg test  loss 833.58, bar  test loss 2.083, len  test loss 0.030, col  test loss 144.425


Epoch 499: 272batch [00:22, 12.24batch/s, loss=771]


epoch 499: avg train loss 757.08, bar train loss 1.639, len train loss 0.019, col train loss 130.715


Epoch 500: 0batch [00:00, ?batch/s]

epoch 499: avg test  loss 833.73, bar  test loss 2.080, len  test loss 0.025, col  test loss 144.371


Epoch 500: 272batch [00:22, 12.16batch/s, loss=803]


epoch 500: avg train loss 756.87, bar train loss 1.638, len train loss 0.019, col train loss 130.700
epoch 500: avg test  loss 833.94, bar  test loss 2.074, len  test loss 0.025, col  test loss 144.305


In [None]:
lss2, lss_t2 = train(default_args, train_loader, test_loader, diva, optimizer, 1000, 500, save_folder="VAEFC")

In [None]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 5600, 2200, save_folder="VAE4")

In [None]:
def plot_loss_acc(lss, lss_t):
    fig,ax = plt.subplots()
    ax.plot(lss, label="train loss")
    ax.plot(lss_t, label = "test loss")
    #ax1 = ax.twinx()
    #ax1.plot(yacc, label = "train accuracy", ls='--')
    #ax1.plot(yacc_t, label = "test accuracy", ls='--')

    lines, labels = ax.get_legend_handles_labels()
    #lines2, labels2 = ax1.get_legend_handles_labels()

    ax.legend(lines, labels)

In [None]:
plot_loss_acc(lss, lss_t)

In [None]:
plot_loss_acc(lss3, lss_t3, yacc3, yacc_t3)

In [None]:
def plot_change_latent_var(diva, lat_space="y", var_idx=[0,1,2,3,4,5,6,7], step = 5):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:len(var_idx)].to(DEVICE).float()
        x = a[1][0][:len(var_idx)].to(DEVICE).float()
        y = a[1][1][:len(var_idx)].to(DEVICE).float()

        zx, zx_sc = diva.qzx(x)
        zy, zy_sc = diva.qzy(x)
        zd, zd_sc =  diva.qzd(x)

        print(torch.max(zy), torch.min(zy), "sdmax:", torch.max(zy_sc))

        out = change(zx, zy, zd, var_idx, lat_space, diva, step)
    
    fig, ax = plt.subplots(ncols=out.shape[0],nrows=len(var_idx),figsize=(10*4*out.shape[0],10*len(var_idx)))
    for i in range(out.shape[0]):
      for j in range(len(var_idx)):
        ax[j,i].imshow(out[i,j])

In [None]:
def change(zx, zy, zd, idx, lat = "y", model=diva, step = 2):
    
    dif = np.arange(-30,15,step)
    print(torch.max(zy), torch.min(zy))
    out = np.zeros((dif.shape[0], len(idx), 25, 100 ,3))  
    #print(zy.shape, dif.shape[0])
    for i in range(dif.shape[0]):
      for j in range(len(idx)):
        if lat == "y":
            zy[j,idx] = dif[i]
        elif lat == "x":
            zx[j,idx] = dif[i]
        elif lat == "d":
            zd[j,idx] = dif[i]
        len_, bar, col = model.px(zd[j],zx[j],zy[j])
        out[i,j] = model.px.reconstruct_image(len_[None,:], bar, col)
    
    return out



In [None]:
plot_change_latent_var(diva)

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss2], label="train loss")
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss_t2], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(50,120), yacc2, label = "train")
ax1.plot(np.arange(50,120), yacc_t2, label = "test")

plt.legend()

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss3], label="train loss")
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss_t3], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(120,180), yacc3, label = "train",c='green')
ax1.plot(np.arange(120,180), yacc_t3, label = "test")

plt.legend()

# Model Evaluation

## Sampling from trained model

In [None]:
def plot_latent_space(lat_space="y"):
    '''
    lat_space: y, d, x
    '''

    

In [None]:
plot(x, out, 0)

In [None]:
fig, ax = plt.subplots(nrows=3, ncols=3)
for i in range(9):
  ax[i//3, i%3].imshow(x[i].cpu().permute(1,2,0))
  
plt.savefig('divastamporg.png')