In [1]:
link = 'D:/users/Marko/downloads/mirna/'

# Imports

In [2]:
%load_ext tensorboard

In [8]:
import sys
#sys.path.insert(0,'/content/drive/MyDrive/Marko/master')
sys.path.insert(0, link)
import numpy as np
import matplotlib.pyplot as plt

#import tensorflow as tf

import torch
import torch.optim as optim
import torch.nn as nn
import torch.distributions as dist

from torch.nn import functional as F
from torchinfo import summary
from torch.utils.tensorboard import SummaryWriter
from torch.utils.data import Dataset, DataLoader

from sklearn.preprocessing import OneHotEncoder

from tqdm import tqdm
from tqdm import trange

import datetime


writer = SummaryWriter(f"{link}/saved_models/VAE11/tensorboard")

In [9]:
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")

In [10]:
DEVICE

device(type='cuda')

# Model Classes

In [11]:
class diva_args:

    def __init__(self, z_dim=64, d_dim=45, x_dim=7500, y_dim=2,
                 beta=10, rec_alpha = 1, rec_beta = 1, 
                 rec_gamma = 1, warmup = 1, prewarmup = 1):

        self.z_dim = z_dim
        self.d_dim = d_dim
        self.x_dim = x_dim
        self.y_dim = y_dim
        
        self.beta = beta
        self.rec_alpha = rec_alpha
        self.rec_beta = rec_beta
        self.rec_gamma = rec_gamma
        self.warmup = warmup
        self.prewarmup = prewarmup


## Dataset Class

In [12]:
class MicroRNADataset(Dataset):

    def __init__(self, ds='train', create_encodings=False):
        
        # loading images
        self.images = np.load(f'{link}/data/modmirbase_{ds}_images.npz')['arr_0']/255
        
        
        # loading labels
        print('Loading Labels! (~10s)')     
        ohe = OneHotEncoder(categories='auto', sparse=False)
        labels = np.load(f'{link}/data/modmirbase_{ds}_labels.npz')['arr_0']
        self.labels = ohe.fit_transform(labels)
        
        # loading encoded images
        print("loading encodings")
        if create_encodings:
            x_len, x_col, x_bar = self.get_encoded_values(self.images, ds)
        else:
            x_len = np.load(f'{link}/data/modmirbase_{ds}_images_len2.npz')
            x_bar = np.load(f'{link}/data/modmirbase_{ds}_images_bar2.npz')
            x_col = np.load(f'{link}/data/modmirbase_{ds}_images_col2.npz')
        
        self.x_len = x_len
        self.x_bar = x_bar
        self.x_col = x_col
        

        # loading names
        print('Loading Names! (~5s)')
        names =  np.load(f'{link}/data/modmirbase_{ds}_names.npz')['arr_0']
        names = [i.decode('utf-8') for i in names]
        self.species = ['mmu', 'prd', 'hsa', 'ptr', 'efu', 'cbn', 'gma', 'pma',
                        'cel', 'gga', 'ipu', 'ptc', 'mdo', 'cgr', 'bta', 'cin', 
                        'ppy', 'ssc', 'ath', 'cfa', 'osa', 'mtr', 'gra', 'mml',
                        'stu', 'bdi', 'rno', 'oan', 'dre', 'aca', 'eca', 'chi',
                        'bmo', 'ggo', 'aly', 'dps', 'mdm', 'ame', 'ppc', 'ssa',
                        'ppt', 'tca', 'dme', 'sbi']
        # assigning a species label to each observation from species
        # with more than 200 observations from past research
        self.names = []
        for i in names:
            append = False
            for j in self.species:
                if j in i.lower():
                    self.names.append(j)
                    append = True
                    break
            if not append:
                if 'random' in i.lower() or i.isdigit():
                    self.names.append('hsa')
                else:
                    self.names.append('notfound')
        
        # performing one hot encoding
        ohe = OneHotEncoder(categories='auto', sparse=False)
        self.names_ohe = ohe.fit_transform(np.array(self.names).reshape(-1,1))
      
    def __len__(self):
        return(self.images.shape[0])

    def __getitem__(self, idx):
        d = self.names_ohe[idx]
        y = self.labels[idx]
        x = self.images[idx]
        x = np.transpose(x, (2,0,1))
        x_len = self.x_len[idx]
        x_col = self.x_col[idx]
        x_bar = self.x_bar[idx]
        return (x, y, d, x_len, x_col, x_bar)


    def get_encoded_values(self, x, ds):
        """
        given an image or batch of images
        returns length of strand, length of bars and colors of bars
        """
        n = x.shape[0]
        x = np.transpose(x, (0,3,1,2))
        out_len = np.zeros((n), dtype=np.uint8)
        out_col = np.zeros((n,5,200), dtype=np.uint8)
        out_bar = np.zeros((n,2,100), dtype=np.uint8)

        for i in range(n):
            if i % 100 == 0:
                print(f'at {i} out of {n}')
            rna_len = 0
            broke = False
            for j in range(100):
                if (x[i,:,12,j] == np.array([1,1,1])).all():
                    out_len[i] = rna_len
                    broke = True
                    break
                else:
                    rna_len += 1
                    # check color of bars
                    out_col[i, self.get_color(x[i,:,12,j]) ,2*j] = 1 
                    out_col[i, self.get_color(x[i,:,13,j]), 2*j+1] = 1
                    # check length of bars
                    len1 = 0
                    # loop until white pixel
                    while not (x[i,:,12-len1,j] == np.array([1.,1.,1.])).all():
                        len1 += 1
                        if 13-len1 == 0:
                            break
                    out_bar[i, 0, j] = len1

                    len2 = 0
                    while not (x[i,:,13+len2,j] == np.array([1.,1.,1.])).all():
                        len2 += 1
                        if 13+len2 == 25:
                            break
                    out_bar[i, 1, j] = len2
            if not broke:
                out_len[i] = rna_len


        with open(f'{link}/data/modmirbase_{ds}_images_len2.npz', 'wb') as f:
            np.save(f, out_len)
        with open(f'{link}/data/modmirbase_{ds}_images_col2.npz', 'wb') as f:
            np.save(f, out_col)
        with open(f'{link}/data/modmirbase_{ds}_images_bar2.npz', 'wb') as f:
            np.save(f, out_bar)
        

        return out_len, out_bar, out_col

    def get_color(self, pixel):
        """
        returns the encoded value for a pixel
        """
        if (pixel == np.array([0,0,0])).all():  
            return 0 # black
        elif (pixel == np.array([1,0,0])).all():  
            return 1 # red
        elif (pixel == np.array([0,0,1])).all():  
            return 2 # blue
        elif (pixel == np.array([0,1,0])).all():  
            return 3 # green
        elif (pixel == np.array([1,1,0])).all():  
            return 4 # yellow
        else:
            print("Something wrong!")


## Decoder classes

In [13]:
# Decoders
class px(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z_dim):
        super(px, self).__init__()

        self.fc1 = nn.Sequential(nn.Linear(z_dim, 1600, bias=False),  
                                 nn.ReLU())
        
        self.fc2 = nn.Sequential(nn.Linear(1600, 1000, bias=False),  
                                 nn.ReLU())
        # Predicting length and color of each bar
        self.up1 = nn.Upsample(scale_factor=5)
        self.de1 = nn.Sequential(nn.ConvTranspose1d(50,100,kernel_size = 5,
                                                    stride = 1, padding = 2),
                                 nn.ReLU(),)
        self.up2 = nn.Upsample(scale_factor=2)
        self.de2 = nn.Sequential(
                                 nn.ConvTranspose1d(100,100,kernel_size = 5,
                                                    stride = 1, padding = 2),
                                 nn.ReLU(),
                                 )
        # Predicting color of each bar
        self.color_bar = nn.Sequential(nn.Conv1d(100,5, kernel_size = 9, padding = 'same', padding_mode='reflect'),
                                      nn.Softmax(dim=1))
        
        # Predicting the length of each bar
        self.length_bar = nn.Sequential(nn.Conv1d(100, 2, kernel_size = 9, padding = 4, padding_mode='reflect', stride=2), nn.Softplus())
        #self.length_bar_scale = nn.Sequential(nn.Conv1d(100, 1, kernel_size = 3, padding = 'same', bias=False), nn.Sigmoid())
        # Predicting length of the RNA strand
        self.length_RNA = nn.Sequential(nn.Linear(1000,400), nn.ReLU(),nn.Linear(400,1), nn.Softplus())
        #self.length_RNA_scale = nn.Sequential(nn.Linear(400,1, bias=False), nn.Sigmoid())
        
    def forward(self, z):
        
        h = self.fc1(z)
        h = self.fc2(h)
        
        len_RNA = self.length_RNA(h)
        
        len_RNA_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)
        #len_RNA_sc = torch.exp(self.length_RNA_scale(h))
        
        h = h.view(-1, 50, 20)
        h = self.up1(h)
        h = self.de1(h)
        h = self.up2(h)
        h = self.de2(h)
        len_bar = self.length_bar(h)
        len_bar_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)
        #len_bar_sc = torch.exp(self.length_bar_scale(h))
        
        
        col_bar = self.color_bar(h)
        
        
        return len_RNA, len_RNA_sc, len_bar, len_bar_sc, col_bar

    def reconstruct_image(self, len_RNA, var_RNA, len_bar, var_bar ,col_bar, sample=False):
        """
        reconstructs RNA image given output from decoder
        even indexes of len_bar and col_bar   -> top
        uneven indexes of len_bar and col_bar -> bottom
        function does not support sampling yet
        color reconstructions: 0: black
                               1: red
                               2: blue
                               3: green
                               4: yellow
        """
        color_dict = {
                  0: np.array([0,0,0]), # black
                  1: np.array([1,0,0]), # red
                  3: np.array([0,1,0]), # green
                  2: np.array([0,0,1]), # blue
                  4: np.array([1,1,0])  # yellow
                  }
    
        
        len_RNA = len_RNA.cpu().numpy()
        var_RNA = var_RNA.cpu().numpy()
        #.reshape((100,))
        len_bar = len_bar.cpu().numpy()
        var_bar = var_bar.cpu().numpy()
        col_bar = col_bar.cpu().numpy()
        n = len_RNA.shape[0]
        output = np.ones((n,25,100,3))

        for i in range(n):
            if sample:
                limit = int(np.round(np.random.normal(loc=len_RNA[i], scale=var_RNA[i])))
            else:
                limit = int(np.round(len_RNA[i]))
            limit = min(100, limit)
            for j in range(limit):
                if sample:
                    _len_bar_1 = int(np.round(np.random.normal(loc=len_bar[i,0,j], scale=var_bar[i,0,j])))
                    _len_bar_2 = int(np.round(np.random.normal(loc=len_bar[i,1,j], scale=var_bar[i,1,j])))
                    _col_bar_1 = np.random.choice(np.arange(5), p = col_bar[i, :, 2*j])
                    _col_bar_2 = np.random.choice(np.arange(5), p = col_bar[i,:, 2*j+1])
                else:
                    _len_bar_1 = int(np.round(len_bar[i,0,j])) 
                    _len_bar_2 = int(np.round(len_bar[i,1,j]))
                    _col_bar_1 = np.argmax(col_bar[i,:, 2*j])
                    _col_bar_2 = np.argmax(col_bar[i,:, 2*j+1])
                
                h1 = max(0,13-_len_bar_1)
                # paint upper bar
                output[i, h1:13, j] = color_dict[_col_bar_1]
                h2 = min(25,13+_len_bar_2)
                # paint lower bar
                output[i, 13:h2, j] = color_dict[_col_bar_2]
        
        
        return output


In [14]:
int(np.round(3.7, 0))
int(3.7)

3

In [15]:
# pzy_ = pzy(45, 7500, 2, 32,32,32)
# summary(pzy_, (1,2))
# pzy_ = px(45, 7500, 2, 32,32,32)
# summary(pzy_, [(1,32),(1,32),(1,32)])

## Endcoder Classes

In [16]:
#pzy_.reconstruct_image(torch.zeros((1,100)), torch.zeros((1,13,200)), torch.zeros(1,5,200)).shape

In [17]:
class qz(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z_dim):
        super(qz, self).__init__()

        self.encoder = nn.Sequential(
            nn.Conv2d(3, 64, kernel_size=5, stride=1, padding = 'same',bias=False),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding = 'same', bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
            nn.Conv2d(128, 256, kernel_size=3, stride=1, bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
        )

        self.fc11 = nn.Sequential(nn.Linear(5632, z_dim))
        self.fc12 = nn.Sequential(nn.Linear(5632, z_dim), nn.Softplus())

        torch.nn.init.xavier_uniform_(self.encoder[0].weight)
        torch.nn.init.xavier_uniform_(self.encoder[3].weight)
        torch.nn.init.xavier_uniform_(self.fc11[0].weight)
        self.fc11[0].bias.data.zero_()
        torch.nn.init.xavier_uniform_(self.fc12[0].weight)
        self.fc12[0].bias.data.zero_()

    def forward(self, x):
        h = self.encoder(x)
        h = h.view(-1, 5632)
        z_loc = self.fc11(h)
        z_scale = self.fc12(h) + 1e-7

        return z_loc, z_scale




In [18]:
enc = qz(128,10,10,10)
summary(enc, (1,3,25,100))

Layer (type:depth-idx)                   Output Shape              Param #
qz                                       --                        --
├─Sequential: 1-1                        [1, 256, 2, 11]           --
│    └─Conv2d: 2-1                       [1, 64, 25, 100]          4,800
│    └─ReLU: 2-2                         [1, 64, 25, 100]          --
│    └─MaxPool2d: 2-3                    [1, 64, 12, 50]           --
│    └─Conv2d: 2-4                       [1, 128, 12, 50]          73,728
│    └─ReLU: 2-5                         [1, 128, 12, 50]          --
│    └─MaxPool2d: 2-6                    [1, 128, 6, 25]           --
│    └─Conv2d: 2-7                       [1, 256, 4, 23]           294,912
│    └─ReLU: 2-8                         [1, 256, 4, 23]           --
│    └─MaxPool2d: 2-9                    [1, 256, 2, 11]           --
├─Sequential: 1-2                        [1, 10]                   --
│    └─Linear: 2-10                      [1, 10]                   56,330

## Full model class

In [28]:
class StampDIVA(nn.Module):
    def __init__(self, args):
        super(StampDIVA, self).__init__()
        self.z_dim = args.z_dim
        self.d_dim = args.d_dim
        self.x_dim = args.x_dim
        self.y_dim = args.y_dim

        self.px = px(self.d_dim, self.x_dim, self.y_dim, self.z_dim)
        
        self.qz = qz(self.d_dim, self.x_dim, self.y_dim, self.z_dim)
        

        self.beta = args.beta
        
        self.rec_alpha = args.rec_alpha
        self.rec_beta = args.rec_beta
        self.rec_gamma = args.rec_gamma

        self.warmup = args.warmup
        self.prewarmup = args.prewarmup

        self.cuda()

    def forward(self, d, x, y):
        # Encode
        zd_q_loc, zd_q_scale = self.qz(x)
        
        # Reparameterization trick
        qz = dist.Normal(zd_q_loc, zd_q_scale)
        z_q = qz.rsample()
        
        
        # Decode
        x_len, x_len_scale, x_bar, x_bar_scale, x_col = self.px(z_q)
        z_p_loc, z_p_scale = torch.zeros(z_q.size()[0], self.z_dim).cuda(),\
                        torch.ones(z_q.size()[0], self.z_dim).cuda()
        pz = dist.Normal(z_p_loc, z_p_scale)

        # Reparameterization trick
        pz = dist.Normal(z_p_loc, z_p_scale)
        
        return x_len, x_len_scale, x_bar, x_bar_scale, x_col, qz, pz, z_q

    def loss_function(self, d, x, y, out_len, out_bar, out_col):
        
        x_len, x_len_scale, x_bar, x_bar_scale, x_col, qz, pz, z_q = self.forward(d, x, y)
        mask = 1 - F.one_hot(torch.round(out_len).to(torch.int64)*2-1, 200).cumsum(dim=1)[:,None,:]
        mask1 = (1 - F.one_hot(torch.round(out_len).to(torch.int64)-1, 100).cumsum(dim=1)[:,None,:]).repeat(1,2,1)

        
        #x_bar = mask.repeat(1,1,1)*x_bar
        
        #x_bar_scale = mask.repeat(1,1,1)*x_bar_scale
        x_col = mask.repeat(1,5,1)*x_col
        
        
        dist_len = dist.Normal(x_len, x_len_scale+1e-7)
        log_len = dist_len.log_prob(out_len[:,None]).mean()
        
       # dist_bar = dist.Normal(x_bar, x_bar_scale+1e-7)
        #log_bar = dist_bar.log_prob(out_bar)*mask1
        #log_bar = (log_bar).sum(dim=(1,2)).mean()
        
        mse_bar = ((((x_bar - out_bar)**2)*mask1).sum(dim=(1,2))/(mask1.sum(dim=(1,2)))).sum()#.detach().item()
        
        max_bar = torch.argmax(x_col, dim=1)
        #acc_bar = (((max_bar==out_col)*mask).sum(dim=(1,2))/mask.sum(dim=(1,2))).sum().detach().item()/5
        acc_bar = (max_bar==torch.argmax(out_col, dim=1)).sum().float()
        
        CE_len = -log_len
        CE_bar = mse_bar#-log_bar
        CE_col = F.cross_entropy(x_col, out_col, reduction='sum')

        KL_z = torch.sum(pz.log_prob(z_q) - qz.log_prob(z_q))
          
        return self.rec_alpha * CE_len \
                  + self.rec_beta * CE_bar \
                  + self.rec_gamma * CE_col \
                  - self.beta * KL_z, \
                  CE_bar, CE_len, CE_col, mse_bar, acc_bar

In [29]:
default_args = diva_args(z_dim=1600, rec_alpha = 10, rec_beta = 10, rec_gamma = 10, 
                         beta=1, warmup=1, prewarmup=0)
enc = StampDIVA(default_args)
summary(enc,[ (1,1),(1,3,25,100),(1,1)])

Layer (type:depth-idx)                   Output Shape              Param #
StampDIVA                                --                        --
├─qz: 1-1                                [1, 1600]                 --
│    └─Sequential: 2-1                   [1, 256, 2, 11]           --
│    │    └─Conv2d: 3-1                  [1, 64, 25, 100]          4,800
│    │    └─ReLU: 3-2                    [1, 64, 25, 100]          --
│    │    └─MaxPool2d: 3-3               [1, 64, 12, 50]           --
│    │    └─Conv2d: 3-4                  [1, 128, 12, 50]          73,728
│    │    └─ReLU: 3-5                    [1, 128, 12, 50]          --
│    │    └─MaxPool2d: 3-6               [1, 128, 6, 25]           --
│    │    └─Conv2d: 3-7                  [1, 256, 4, 23]           294,912
│    │    └─ReLU: 3-8                    [1, 256, 4, 23]           --
│    │    └─MaxPool2d: 3-9               [1, 256, 2, 11]           --
│    └─Sequential: 2-2                   [1, 1600]                 --
│  

# Training the model

## Loading dataset

In [30]:
RNA_dataset = MicroRNADataset(create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [31]:
RNA_dataset_test = MicroRNADataset('test', create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [32]:
def train_single_epoch(train_loader, model, optimizer, epoch):
    model.train()
    train_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    no_batches = 0
    train_corr = 0
    mse_bar = 0
    acc_bar = 0
    pbar = tqdm(enumerate(train_loader), unit="batch", 
                                     desc=f'Epoch {epoch}')
    for batch_idx, (x, y, d, x_len, x_col, x_bar) in pbar:
        # To device
        x, y, d , x_len, x_bar, x_col = x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE)

        optimizer.zero_grad()
        loss, bar_loss, len_loss, col_loss, mse, acc = model.loss_function(d.float(), x.float(), y.float(), x_len.float(), x_bar.float(), x_col.float())
      
        loss.backward()
        optimizer.step()
        pbar.set_postfix(loss=loss.item()/x.shape[0])
        train_loss += loss
        epoch_bar_loss += bar_loss
        epoch_col_loss += col_loss
        epoch_len_loss += len_loss
        mse_bar += mse
        acc_bar += acc
        no_batches += 1

    train_loss /= len(train_loader.dataset)
    epoch_bar_loss /= len(train_loader.dataset)
    epoch_len_loss /= len(train_loader.dataset)
    epoch_col_loss /= len(train_loader.dataset)
    acc_bar /= len(train_loader.dataset)
    mse_bar /= len(train_loader.dataset)
    
    return train_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar

In [33]:
def test_single_epoch(test_loader, model, epoch):
    model.eval()
    test_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    mse_bar = 0
    acc_bar = 0        
    with torch.no_grad():
        for batch_idx, (x,y,d,x_len,x_col,x_bar) in enumerate(test_loader):
            x, y, d, x_len, x_bar, x_col = x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE)
            loss, bar_loss, len_loss, col_loss, mse, acc = model.loss_function(d.float(), x.float(), y.float(),x_len.float(),x_bar.float(),x_col.float())
            test_loss += loss
            epoch_bar_loss += bar_loss
            epoch_col_loss += col_loss
            epoch_len_loss += len_loss
            mse_bar += mse
            acc_bar += acc
    test_loss /= len(test_loader.dataset)
    epoch_bar_loss /= len(test_loader.dataset)
    epoch_len_loss /= len(test_loader.dataset)
    epoch_col_loss /= len(test_loader.dataset)
    acc_bar /= len(test_loader.dataset)
    mse_bar /= len(test_loader.dataset)
    
    return test_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar
  

In [34]:
def train(args, train_loader, test_loader, diva, optimizer, end_epoch, start_epoch=0, save_folder='sd_1.0.0',save_interval=5):
    
    epoch_loss_sup = []
    test_loss = []
    
    for epoch in range(start_epoch+1, end_epoch+1):
        diva.beta = min([args.beta, args.beta * (epoch - args.prewarmup * 1.) / (args.warmup)])
        if epoch< args.prewarmup:
            diva.beta = args.beta/args.prewarmup
        train_loss, avg_loss_bar, avg_loss_len, avg_loss_col, mtr, atr = train_single_epoch(train_loader, diva, optimizer, epoch)
        str_loss_sup = train_loss
        epoch_loss_sup.append(train_loss)
        str_print = "epoch {}: avg train loss {:.2f}".format(epoch, str_loss_sup)
        str_print += ", bar train loss {:.3f}".format(avg_loss_bar)
        str_print += ", len train loss {:.3f}".format(avg_loss_len)
        str_print += ", col train loss {:.3f}".format(avg_loss_col)
        print(str_print)

        rec_loss_train = diva.rec_alpha * avg_loss_len + diva.rec_beta * avg_loss_bar + diva.rec_gamma * avg_loss_col
        dis_loss_train = train_loss - rec_loss_train

        test_lss, avg_loss_bar_test, avg_loss_len_test, avg_loss_col_test, mte, ate = test_single_epoch(test_loader, diva, epoch)
        test_loss.append(test_lss)
       
        str_print = "epoch {}: avg test  loss {:.2f}".format(epoch, test_lss)
        str_print += ", bar  test loss {:.3f}".format(avg_loss_bar_test)
        str_print += ", len  test loss {:.3f}".format(avg_loss_len_test)
        str_print += ", col  test loss {:.3f}".format(avg_loss_col_test)
        print(str_print)

        rec_loss_test = diva.rec_alpha * avg_loss_len_test + diva.rec_beta * avg_loss_bar_test + diva.rec_gamma * avg_loss_col_test
        dis_loss_test = test_lss - rec_loss_test

        if writer is not None:
            
            writer.add_scalars("Total_Loss", {'train': train_loss, 'test': test_lss} ,epoch)
            writer.add_scalars("Reconstruction_vs_Disentanglement",{'rec':rec_loss_train, 'dis':dis_loss_train}, epoch)
            writer.add_scalars("bar_mse",{'train': mtr, 'test':mte}, epoch)
            writer.add_scalars("bar_acc",{'train': atr, 'test':ate}, epoch)

        if epoch % save_interval == 0:
            torch.save(diva.state_dict(), f'{link}/saved_models/{save_folder}/checkpoints/{epoch}.pth')
            save_reconstructions(epoch, test_loader, diva, name=save_folder)
            save_reconstructions(epoch, train_loader, diva, name=save_folder, estr='tr')


    if writer is not None:
        writer.flush()

    epoch_loss_sup = [i.cpu().detach().numpy() for i in epoch_loss_sup]
    test_loss = [i.cpu().detach().numpy() for i in test_loss]
    return epoch_loss_sup, test_loss

In [35]:
def save_reconstructions(epoch, test_loader, diva, name='diva', estr=''):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:10].to(DEVICE).float()
        x = a[1][0][:10].to(DEVICE).float()
        y = a[1][1][:10].to(DEVICE).float()
        x_1, x_1var, x_2, x_2var, x_3, _, _, _ = diva(d,x,y)
        out = diva.px.reconstruct_image(x_1, x_1var, x_2, x_2var, x_3)

    plt.figure(figsize=(80,20))
    fig, ax = plt.subplots(nrows=10, ncols=2)

    ax[0,0].set_title("Original")
    ax[0,1].set_title("Reconstructed")

    for i in range(10):
        ax[i, 1].imshow(out[i])
        ax[i, 0].imshow(x[i].cpu().permute(1,2,0))
        ax[i, 0].xaxis.set_visible(False)
        ax[i, 0].yaxis.set_visible(False)
        ax[i, 1].xaxis.set_visible(False)
        ax[i, 1].yaxis.set_visible(False)
    fig.tight_layout(pad=0.1)
    plt.savefig(f'{link}/saved_models/{name}/reconstructions/e{epoch}{estr}.png')
    plt.close('all')

In [36]:
DEVICE

device(type='cuda')

## Model Training

In [37]:
default_args = diva_args(z_dim=1600, rec_alpha = 100, rec_beta = 10, rec_gamma = 10, 
                         beta=1, warmup=1, prewarmup=0)

In [41]:
diva = StampDIVA(default_args).to(DEVICE)

In [40]:
#diva.load_state_dict(torch.load(f'{link}/saved_models/VAE10/checkpoints/905.pth'))

In [42]:
train_loader = DataLoader(RNA_dataset, batch_size=128, shuffle=True)
test_loader = DataLoader(RNA_dataset_test, batch_size=128)

In [44]:
optimizer = optim.Adam(diva.parameters(), lr=0.0005)

In [45]:
RNA_dataset.x_len.min(), RNA_dataset.x_len.max()

(10, 100)

In [47]:
%tensorboard --logdir="D:/users/Marko/downloads/mirna/saved_models/VAE11/tensorboard/"

In [48]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 2000, 0, save_folder="VAE11",save_interval=5)

Epoch 1: 272batch [00:21, 12.80batch/s, loss=1.8e+3] 


epoch 1: avg train loss 1869.16, bar train loss 11.398, len train loss 0.457, col train loss 169.513
epoch 1: avg test  loss 1817.56, bar  test loss 9.837, len  test loss 0.160, col  test loss 169.337


Epoch 2: 272batch [00:18, 14.53batch/s, loss=1.73e+3]


epoch 2: avg train loss 1802.40, bar train loss 8.784, len train loss 0.128, col train loss 168.947


Epoch 3: 2batch [00:00, 14.49batch/s, loss=1.85e+3]

epoch 2: avg test  loss 1793.37, bar  test loss 8.603, len  test loss 0.144, col  test loss 167.955


Epoch 3: 272batch [00:18, 14.53batch/s, loss=1.75e+3]


epoch 3: avg train loss 1787.02, bar train loss 8.234, len train loss 0.132, col train loss 167.618


Epoch 4: 2batch [00:00, 14.82batch/s, loss=1.83e+3]

epoch 3: avg test  loss 1782.94, bar  test loss 7.966, len  test loss 0.114, col  test loss 167.513


Epoch 4: 272batch [00:18, 14.52batch/s, loss=1.9e+3] 


epoch 4: avg train loss 1777.67, bar train loss 7.662, len train loss 0.116, col train loss 167.223


Epoch 5: 2batch [00:00, 14.71batch/s, loss=1.72e+3]

epoch 4: avg test  loss 1772.49, bar  test loss 7.346, len  test loss 0.114, col  test loss 166.866


Epoch 5: 272batch [00:18, 14.50batch/s, loss=1.8e+3] 


epoch 5: avg train loss 1769.01, bar train loss 6.868, len train loss 0.118, col train loss 166.814
epoch 5: avg test  loss 1769.05, bar  test loss 6.608, len  test loss 0.146, col  test loss 166.750


Epoch 6: 272batch [00:18, 14.50batch/s, loss=1.85e+3]


epoch 6: avg train loss 1760.11, bar train loss 6.184, len train loss 0.118, col train loss 166.320


Epoch 7: 2batch [00:00, 14.60batch/s, loss=1.78e+3]

epoch 6: avg test  loss 1753.65, bar  test loss 5.906, len  test loss 0.109, col  test loss 165.946


Epoch 7: 272batch [00:18, 14.42batch/s, loss=1.75e+3]


epoch 7: avg train loss 1753.02, bar train loss 5.812, len train loss 0.116, col train loss 165.802


Epoch 8: 2batch [00:00, 14.29batch/s, loss=1.74e+3]

epoch 7: avg test  loss 1751.75, bar  test loss 5.612, len  test loss 0.138, col  test loss 165.573


Epoch 8: 272batch [00:19, 14.15batch/s, loss=1.8e+3] 


epoch 8: avg train loss 1747.46, bar train loss 5.535, len train loss 0.110, col train loss 165.442


Epoch 9: 2batch [00:00, 14.81batch/s, loss=1.8e+3]

epoch 8: avg test  loss 1744.67, bar  test loss 5.359, len  test loss 0.105, col  test loss 165.338


Epoch 9: 272batch [00:18, 14.50batch/s, loss=1.78e+3]


epoch 9: avg train loss 1744.25, bar train loss 5.361, len train loss 0.110, col train loss 165.169


Epoch 10: 2batch [00:00, 14.29batch/s, loss=1.72e+3]

epoch 9: avg test  loss 1741.73, bar  test loss 5.246, len  test loss 0.107, col  test loss 164.937


Epoch 10: 272batch [00:18, 14.45batch/s, loss=1.84e+3]


epoch 10: avg train loss 1740.67, bar train loss 5.204, len train loss 0.107, col train loss 164.891
epoch 10: avg test  loss 1747.69, bar  test loss 5.261, len  test loss 0.147, col  test loss 164.810


Epoch 11: 272batch [00:18, 14.49batch/s, loss=1.74e+3]


epoch 11: avg train loss 1737.88, bar train loss 5.078, len train loss 0.105, col train loss 164.650


Epoch 12: 2batch [00:00, 14.49batch/s, loss=1.68e+3]

epoch 11: avg test  loss 1737.45, bar  test loss 5.057, len  test loss 0.100, col  test loss 164.715


Epoch 12: 272batch [00:18, 14.38batch/s, loss=1.75e+3]


epoch 12: avg train loss 1735.47, bar train loss 4.982, len train loss 0.106, col train loss 164.411


Epoch 13: 2batch [00:00, 14.49batch/s, loss=1.73e+3]

epoch 12: avg test  loss 1736.38, bar  test loss 4.865, len  test loss 0.133, col  test loss 164.285


Epoch 13: 272batch [00:18, 14.43batch/s, loss=1.77e+3]


epoch 13: avg train loss 1732.63, bar train loss 4.902, len train loss 0.102, col train loss 164.139


Epoch 14: 2batch [00:00, 14.18batch/s, loss=1.79e+3]

epoch 13: avg test  loss 1729.99, bar  test loss 4.842, len  test loss 0.092, col  test loss 164.005


Epoch 14: 272batch [00:18, 14.46batch/s, loss=1.64e+3]


epoch 14: avg train loss 1729.31, bar train loss 4.858, len train loss 0.103, col train loss 163.709


Epoch 15: 2batch [00:00, 14.39batch/s, loss=1.74e+3]

epoch 14: avg test  loss 1729.41, bar  test loss 4.860, len  test loss 0.121, col  test loss 163.449


Epoch 15: 272batch [00:18, 14.42batch/s, loss=1.86e+3]


epoch 15: avg train loss 1683.95, bar train loss 4.593, len train loss 0.101, col train loss 158.766
epoch 15: avg test  loss 1657.78, bar  test loss 4.642, len  test loss 0.099, col  test loss 155.813


Epoch 16: 272batch [00:18, 14.42batch/s, loss=1.61e+3]


epoch 16: avg train loss 1650.27, bar train loss 4.393, len train loss 0.101, col train loss 155.144


Epoch 17: 2batch [00:00, 14.49batch/s, loss=1.73e+3]

epoch 16: avg test  loss 1648.04, bar  test loss 4.533, len  test loss 0.098, col  test loss 154.773


Epoch 17: 272batch [00:19, 14.17batch/s, loss=1.72e+3]


epoch 17: avg train loss 1642.80, bar train loss 4.323, len train loss 0.100, col train loss 154.284


Epoch 18: 2batch [00:00, 14.49batch/s, loss=1.67e+3]

epoch 17: avg test  loss 1643.00, bar  test loss 4.242, len  test loss 0.095, col  test loss 154.166


Epoch 18: 272batch [00:18, 14.41batch/s, loss=1.64e+3]


epoch 18: avg train loss 1635.49, bar train loss 4.248, len train loss 0.094, col train loss 153.512


Epoch 19: 2batch [00:00, 14.39batch/s, loss=1.58e+3]

epoch 18: avg test  loss 1631.86, bar  test loss 4.180, len  test loss 0.090, col  test loss 153.112


Epoch 19: 272batch [00:19, 14.31batch/s, loss=1.52e+3]


epoch 19: avg train loss 1630.20, bar train loss 4.192, len train loss 0.096, col train loss 152.845


Epoch 20: 2batch [00:00, 14.18batch/s, loss=1.65e+3]

epoch 19: avg test  loss 1629.86, bar  test loss 4.359, len  test loss 0.094, col  test loss 152.562


Epoch 20: 272batch [00:18, 14.41batch/s, loss=1.66e+3]


epoch 20: avg train loss 1625.25, bar train loss 4.145, len train loss 0.091, col train loss 152.320
epoch 20: avg test  loss 1624.41, bar  test loss 4.192, len  test loss 0.089, col  test loss 152.426


Epoch 21: 272batch [00:18, 14.42batch/s, loss=1.72e+3]


epoch 21: avg train loss 1622.00, bar train loss 4.103, len train loss 0.091, col train loss 151.907


Epoch 22: 2batch [00:00, 14.49batch/s, loss=1.57e+3]

epoch 21: avg test  loss 1625.35, bar  test loss 4.396, len  test loss 0.085, col  test loss 152.049


Epoch 22: 272batch [00:18, 14.40batch/s, loss=1.67e+3]


epoch 22: avg train loss 1618.76, bar train loss 4.072, len train loss 0.091, col train loss 151.517


Epoch 23: 2batch [00:00, 13.51batch/s, loss=1.64e+3]

epoch 22: avg test  loss 1618.38, bar  test loss 4.050, len  test loss 0.089, col  test loss 151.537


Epoch 23: 272batch [00:19, 14.01batch/s, loss=1.51e+3]


epoch 23: avg train loss 1616.12, bar train loss 4.044, len train loss 0.089, col train loss 151.201


Epoch 24: 2batch [00:00, 14.29batch/s, loss=1.66e+3]

epoch 23: avg test  loss 1618.16, bar  test loss 4.084, len  test loss 0.101, col  test loss 151.577


Epoch 24: 272batch [00:19, 14.28batch/s, loss=1.61e+3]


epoch 24: avg train loss 1613.35, bar train loss 3.995, len train loss 0.088, col train loss 150.878


Epoch 25: 2batch [00:00, 14.49batch/s, loss=1.62e+3]

epoch 24: avg test  loss 1616.54, bar  test loss 4.046, len  test loss 0.113, col  test loss 150.883


Epoch 25: 272batch [00:19, 14.25batch/s, loss=1.62e+3]


epoch 25: avg train loss 1611.29, bar train loss 3.970, len train loss 0.090, col train loss 150.638
epoch 25: avg test  loss 1611.47, bar  test loss 3.945, len  test loss 0.086, col  test loss 150.525


Epoch 26: 272batch [00:19, 14.11batch/s, loss=1.79e+3]


epoch 26: avg train loss 1608.94, bar train loss 3.952, len train loss 0.087, col train loss 150.365


Epoch 27: 2batch [00:00, 14.18batch/s, loss=1.58e+3]

epoch 26: avg test  loss 1609.52, bar  test loss 3.900, len  test loss 0.078, col  test loss 150.478


Epoch 27: 272batch [00:19, 14.31batch/s, loss=1.7e+3] 


epoch 27: avg train loss 1606.87, bar train loss 3.923, len train loss 0.085, col train loss 150.143


Epoch 28: 2batch [00:00, 14.49batch/s, loss=1.6e+3]

epoch 27: avg test  loss 1608.24, bar  test loss 3.997, len  test loss 0.084, col  test loss 150.098


Epoch 28: 272batch [00:19, 14.31batch/s, loss=1.69e+3]


epoch 28: avg train loss 1604.97, bar train loss 3.896, len train loss 0.084, col train loss 149.899


Epoch 29: 2batch [00:00, 14.71batch/s, loss=1.62e+3]

epoch 28: avg test  loss 1606.28, bar  test loss 3.912, len  test loss 0.081, col  test loss 150.192


Epoch 29: 272batch [00:18, 14.32batch/s, loss=1.72e+3]


epoch 29: avg train loss 1603.40, bar train loss 3.880, len train loss 0.086, col train loss 149.698


Epoch 30: 2batch [00:00, 14.60batch/s, loss=1.63e+3]

epoch 29: avg test  loss 1606.42, bar  test loss 3.919, len  test loss 0.082, col  test loss 149.987


Epoch 30: 272batch [00:19, 14.28batch/s, loss=1.59e+3]


epoch 30: avg train loss 1601.31, bar train loss 3.842, len train loss 0.083, col train loss 149.482
epoch 30: avg test  loss 1604.39, bar  test loss 3.929, len  test loss 0.082, col  test loss 149.677


Epoch 31: 272batch [00:18, 14.32batch/s, loss=1.54e+3]


epoch 31: avg train loss 1599.97, bar train loss 3.824, len train loss 0.083, col train loss 149.321


Epoch 32: 2batch [00:00, 14.60batch/s, loss=1.59e+3]

epoch 31: avg test  loss 1601.45, bar  test loss 3.830, len  test loss 0.080, col  test loss 149.512


Epoch 32: 272batch [00:18, 14.32batch/s, loss=1.74e+3]


epoch 32: avg train loss 1598.03, bar train loss 3.807, len train loss 0.081, col train loss 149.108


Epoch 33: 2batch [00:00, 14.08batch/s, loss=1.6e+3]

epoch 32: avg test  loss 1601.04, bar  test loss 3.773, len  test loss 0.082, col  test loss 149.403


Epoch 33: 272batch [00:19, 14.28batch/s, loss=1.59e+3]


epoch 33: avg train loss 1596.82, bar train loss 3.788, len train loss 0.081, col train loss 148.957


Epoch 34: 2batch [00:00, 13.99batch/s, loss=1.53e+3]

epoch 33: avg test  loss 1599.71, bar  test loss 3.863, len  test loss 0.081, col  test loss 149.270


Epoch 34: 272batch [00:19, 14.07batch/s, loss=1.64e+3]


epoch 34: avg train loss 1594.76, bar train loss 3.786, len train loss 0.079, col train loss 148.761


Epoch 35: 2batch [00:00, 14.39batch/s, loss=1.57e+3]

epoch 34: avg test  loss 1598.98, bar  test loss 3.874, len  test loss 0.084, col  test loss 148.960


Epoch 35: 272batch [00:19, 14.29batch/s, loss=1.64e+3]


epoch 35: avg train loss 1593.40, bar train loss 3.758, len train loss 0.078, col train loss 148.620
epoch 35: avg test  loss 1596.79, bar  test loss 3.766, len  test loss 0.083, col  test loss 148.796


Epoch 36: 272batch [00:19, 14.27batch/s, loss=1.59e+3]


epoch 36: avg train loss 1592.00, bar train loss 3.734, len train loss 0.078, col train loss 148.460


Epoch 37: 2batch [00:00, 14.49batch/s, loss=1.65e+3]

epoch 36: avg test  loss 1595.72, bar  test loss 3.799, len  test loss 0.075, col  test loss 148.838


Epoch 37: 272batch [00:19, 14.09batch/s, loss=1.62e+3]


epoch 37: avg train loss 1590.30, bar train loss 3.695, len train loss 0.074, col train loss 148.333


Epoch 38: 2batch [00:00, 14.39batch/s, loss=1.57e+3]

epoch 37: avg test  loss 1596.22, bar  test loss 4.053, len  test loss 0.072, col  test loss 148.634


Epoch 38: 272batch [00:19, 14.27batch/s, loss=1.51e+3]


epoch 38: avg train loss 1588.79, bar train loss 3.690, len train loss 0.072, col train loss 148.184


Epoch 39: 2batch [00:00, 14.39batch/s, loss=1.6e+3]

epoch 38: avg test  loss 1594.62, bar  test loss 3.686, len  test loss 0.088, col  test loss 148.447


Epoch 39: 272batch [00:19, 14.30batch/s, loss=1.4e+3] 


epoch 39: avg train loss 1587.03, bar train loss 3.687, len train loss 0.069, col train loss 148.020


Epoch 40: 2batch [00:00, 14.18batch/s, loss=1.58e+3]

epoch 39: avg test  loss 1590.65, bar  test loss 3.736, len  test loss 0.068, col  test loss 148.463


Epoch 40: 272batch [00:19, 14.26batch/s, loss=1.73e+3]


epoch 40: avg train loss 1585.71, bar train loss 3.663, len train loss 0.068, col train loss 147.901
epoch 40: avg test  loss 1592.99, bar  test loss 3.869, len  test loss 0.085, col  test loss 148.483


Epoch 41: 272batch [00:19, 14.28batch/s, loss=1.53e+3]


epoch 41: avg train loss 1583.90, bar train loss 3.648, len train loss 0.065, col train loss 147.761


Epoch 42: 2batch [00:00, 14.39batch/s, loss=1.62e+3]

epoch 41: avg test  loss 1590.10, bar  test loss 3.688, len  test loss 0.090, col  test loss 148.044


Epoch 42: 272batch [00:19, 14.26batch/s, loss=1.58e+3]


epoch 42: avg train loss 1582.74, bar train loss 3.635, len train loss 0.064, col train loss 147.655


Epoch 43: 2batch [00:00, 14.08batch/s, loss=1.58e+3]

epoch 42: avg test  loss 1587.70, bar  test loss 3.743, len  test loss 0.064, col  test loss 147.981


Epoch 43: 272batch [00:19, 14.29batch/s, loss=1.48e+3]


epoch 43: avg train loss 1581.09, bar train loss 3.614, len train loss 0.061, col train loss 147.509


Epoch 44: 2batch [00:00, 14.60batch/s, loss=1.55e+3]

epoch 43: avg test  loss 1588.31, bar  test loss 3.627, len  test loss 0.099, col  test loss 147.944


Epoch 44: 272batch [00:19, 14.26batch/s, loss=1.6e+3] 


epoch 44: avg train loss 1580.33, bar train loss 3.597, len train loss 0.061, col train loss 147.415


Epoch 45: 2batch [00:00, 14.08batch/s, loss=1.59e+3]

epoch 44: avg test  loss 1584.04, bar  test loss 3.634, len  test loss 0.061, col  test loss 147.749


Epoch 45: 272batch [00:19, 14.26batch/s, loss=1.41e+3]


epoch 45: avg train loss 1578.98, bar train loss 3.594, len train loss 0.060, col train loss 147.286
epoch 45: avg test  loss 1584.08, bar  test loss 3.648, len  test loss 0.065, col  test loss 147.700


Epoch 46: 272batch [00:19, 14.20batch/s, loss=1.61e+3]


epoch 46: avg train loss 1577.92, bar train loss 3.581, len train loss 0.058, col train loss 147.183


Epoch 47: 2batch [00:00, 14.49batch/s, loss=1.6e+3]

epoch 46: avg test  loss 1583.33, bar  test loss 3.635, len  test loss 0.061, col  test loss 147.884


Epoch 47: 272batch [00:19, 14.29batch/s, loss=1.53e+3]


epoch 47: avg train loss 1576.50, bar train loss 3.557, len train loss 0.056, col train loss 147.046


Epoch 48: 2batch [00:00, 14.39batch/s, loss=1.55e+3]

epoch 47: avg test  loss 1582.30, bar  test loss 3.664, len  test loss 0.056, col  test loss 147.426


Epoch 48: 272batch [00:19, 14.31batch/s, loss=1.59e+3]


epoch 48: avg train loss 1575.88, bar train loss 3.566, len train loss 0.057, col train loss 146.938


Epoch 49: 2batch [00:00, 13.79batch/s, loss=1.61e+3]

epoch 48: avg test  loss 1581.00, bar  test loss 3.615, len  test loss 0.057, col  test loss 147.373


Epoch 49: 272batch [00:19, 14.26batch/s, loss=1.59e+3]


epoch 49: avg train loss 1574.54, bar train loss 3.546, len train loss 0.055, col train loss 146.825


Epoch 50: 2batch [00:00, 14.18batch/s, loss=1.54e+3]

epoch 49: avg test  loss 1579.26, bar  test loss 3.568, len  test loss 0.052, col  test loss 147.214


Epoch 50: 272batch [00:19, 14.26batch/s, loss=1.64e+3]


epoch 50: avg train loss 1573.66, bar train loss 3.528, len train loss 0.054, col train loss 146.742
epoch 50: avg test  loss 1578.52, bar  test loss 3.543, len  test loss 0.051, col  test loss 147.179


Epoch 51: 272batch [00:19, 14.28batch/s, loss=1.46e+3]


epoch 51: avg train loss 1572.11, bar train loss 3.510, len train loss 0.051, col train loss 146.595


Epoch 52: 2batch [00:00, 14.08batch/s, loss=1.61e+3]

epoch 51: avg test  loss 1577.89, bar  test loss 3.549, len  test loss 0.056, col  test loss 147.029


Epoch 52: 272batch [00:19, 14.25batch/s, loss=1.56e+3]


epoch 52: avg train loss 1571.50, bar train loss 3.504, len train loss 0.050, col train loss 146.537


Epoch 53: 2batch [00:00, 14.49batch/s, loss=1.54e+3]

epoch 52: avg test  loss 1577.95, bar  test loss 3.534, len  test loss 0.058, col  test loss 146.936


Epoch 53: 272batch [00:19, 14.25batch/s, loss=1.58e+3]


epoch 53: avg train loss 1570.44, bar train loss 3.482, len train loss 0.050, col train loss 146.425


Epoch 54: 2batch [00:00, 13.89batch/s, loss=1.54e+3]

epoch 53: avg test  loss 1577.08, bar  test loss 3.538, len  test loss 0.059, col  test loss 147.097


Epoch 54: 272batch [00:19, 14.28batch/s, loss=1.43e+3]


epoch 54: avg train loss 1569.50, bar train loss 3.473, len train loss 0.049, col train loss 146.324


Epoch 55: 2batch [00:00, 14.39batch/s, loss=1.55e+3]

epoch 54: avg test  loss 1575.54, bar  test loss 3.555, len  test loss 0.049, col  test loss 147.002


Epoch 55: 272batch [00:19, 14.24batch/s, loss=1.54e+3]


epoch 55: avg train loss 1567.97, bar train loss 3.466, len train loss 0.049, col train loss 146.178
epoch 55: avg test  loss 1573.86, bar  test loss 3.465, len  test loss 0.049, col  test loss 146.667


Epoch 56: 272batch [00:19, 14.24batch/s, loss=1.57e+3]


epoch 56: avg train loss 1567.01, bar train loss 3.453, len train loss 0.046, col train loss 146.097


Epoch 57: 2batch [00:00, 13.79batch/s, loss=1.57e+3]

epoch 56: avg test  loss 1573.15, bar  test loss 3.539, len  test loss 0.051, col  test loss 146.902


Epoch 57: 272batch [00:19, 14.04batch/s, loss=1.65e+3]


epoch 57: avg train loss 1566.45, bar train loss 3.449, len train loss 0.047, col train loss 146.007


Epoch 58: 2batch [00:00, 14.49batch/s, loss=1.53e+3]

epoch 57: avg test  loss 1572.27, bar  test loss 3.485, len  test loss 0.052, col  test loss 146.306


Epoch 58: 272batch [00:19, 14.20batch/s, loss=1.71e+3]


epoch 58: avg train loss 1564.95, bar train loss 3.433, len train loss 0.046, col train loss 145.856


Epoch 59: 2batch [00:00, 14.49batch/s, loss=1.59e+3]

epoch 58: avg test  loss 1572.25, bar  test loss 3.497, len  test loss 0.047, col  test loss 146.625


Epoch 59: 272batch [00:19, 14.19batch/s, loss=1.65e+3]


epoch 59: avg train loss 1563.81, bar train loss 3.407, len train loss 0.045, col train loss 145.739


Epoch 60: 2batch [00:00, 14.29batch/s, loss=1.52e+3]

epoch 59: avg test  loss 1570.09, bar  test loss 3.474, len  test loss 0.046, col  test loss 146.486


Epoch 60: 272batch [00:19, 14.20batch/s, loss=1.55e+3]


epoch 60: avg train loss 1563.22, bar train loss 3.411, len train loss 0.045, col train loss 145.670
epoch 60: avg test  loss 1568.13, bar  test loss 3.475, len  test loss 0.044, col  test loss 146.119


Epoch 61: 272batch [00:19, 13.82batch/s, loss=1.55e+3]


epoch 61: avg train loss 1562.06, bar train loss 3.386, len train loss 0.043, col train loss 145.553


Epoch 62: 2batch [00:00, 13.89batch/s, loss=1.58e+3]

epoch 61: avg test  loss 1570.01, bar  test loss 3.418, len  test loss 0.045, col  test loss 146.426


Epoch 62: 272batch [00:19, 14.07batch/s, loss=1.73e+3]


epoch 62: avg train loss 1561.05, bar train loss 3.377, len train loss 0.043, col train loss 145.456


Epoch 63: 2batch [00:00, 14.18batch/s, loss=1.59e+3]

epoch 62: avg test  loss 1568.81, bar  test loss 3.428, len  test loss 0.048, col  test loss 145.730


Epoch 63: 272batch [00:19, 14.20batch/s, loss=1.59e+3]


epoch 63: avg train loss 1560.14, bar train loss 3.365, len train loss 0.045, col train loss 145.344


Epoch 64: 2batch [00:00, 14.39batch/s, loss=1.63e+3]

epoch 63: avg test  loss 1567.20, bar  test loss 3.486, len  test loss 0.045, col  test loss 146.106


Epoch 64: 272batch [00:19, 14.21batch/s, loss=1.59e+3]


epoch 64: avg train loss 1558.88, bar train loss 3.348, len train loss 0.042, col train loss 145.235


Epoch 65: 2batch [00:00, 14.39batch/s, loss=1.6e+3]

epoch 64: avg test  loss 1566.43, bar  test loss 3.458, len  test loss 0.044, col  test loss 145.905


Epoch 65: 272batch [00:19, 14.17batch/s, loss=1.65e+3]


epoch 65: avg train loss 1557.80, bar train loss 3.337, len train loss 0.043, col train loss 145.111
epoch 65: avg test  loss 1565.12, bar  test loss 3.335, len  test loss 0.044, col  test loss 145.762


Epoch 66: 272batch [00:19, 14.21batch/s, loss=1.46e+3]


epoch 66: avg train loss 1556.83, bar train loss 3.319, len train loss 0.042, col train loss 145.003


Epoch 67: 2batch [00:00, 14.39batch/s, loss=1.49e+3]

epoch 66: avg test  loss 1564.00, bar  test loss 3.468, len  test loss 0.044, col  test loss 145.619


Epoch 67: 272batch [00:19, 13.83batch/s, loss=1.55e+3]


epoch 67: avg train loss 1555.63, bar train loss 3.316, len train loss 0.041, col train loss 144.890


Epoch 68: 2batch [00:00, 14.08batch/s, loss=1.55e+3]

epoch 67: avg test  loss 1563.42, bar  test loss 3.355, len  test loss 0.043, col  test loss 145.602


Epoch 68: 272batch [00:19, 14.16batch/s, loss=1.55e+3]


epoch 68: avg train loss 1554.77, bar train loss 3.297, len train loss 0.041, col train loss 144.793


Epoch 69: 2batch [00:00, 14.08batch/s, loss=1.56e+3]

epoch 68: avg test  loss 1561.30, bar  test loss 3.331, len  test loss 0.041, col  test loss 145.586


Epoch 69: 272batch [00:19, 14.17batch/s, loss=1.65e+3]


epoch 69: avg train loss 1553.45, bar train loss 3.289, len train loss 0.041, col train loss 144.649


Epoch 70: 2batch [00:00, 13.99batch/s, loss=1.52e+3]

epoch 69: avg test  loss 1561.54, bar  test loss 3.433, len  test loss 0.044, col  test loss 145.406


Epoch 70: 272batch [00:19, 14.15batch/s, loss=1.61e+3]


epoch 70: avg train loss 1552.36, bar train loss 3.276, len train loss 0.041, col train loss 144.521
epoch 70: avg test  loss 1559.82, bar  test loss 3.270, len  test loss 0.040, col  test loss 145.237


Epoch 71: 272batch [00:19, 14.15batch/s, loss=1.46e+3]


epoch 71: avg train loss 1551.59, bar train loss 3.275, len train loss 0.040, col train loss 144.428


Epoch 72: 2batch [00:00, 14.18batch/s, loss=1.51e+3]

epoch 71: avg test  loss 1559.14, bar  test loss 3.395, len  test loss 0.042, col  test loss 145.018


Epoch 72: 272batch [00:19, 14.14batch/s, loss=1.5e+3] 


epoch 72: avg train loss 1549.94, bar train loss 3.244, len train loss 0.040, col train loss 144.262


Epoch 73: 2batch [00:00, 13.79batch/s, loss=1.59e+3]

epoch 72: avg test  loss 1559.60, bar  test loss 3.347, len  test loss 0.042, col  test loss 145.204


Epoch 73: 272batch [00:19, 14.11batch/s, loss=1.37e+3]


epoch 73: avg train loss 1549.08, bar train loss 3.237, len train loss 0.039, col train loss 144.179


Epoch 74: 2batch [00:00, 14.08batch/s, loss=1.5e+3]

epoch 73: avg test  loss 1556.14, bar  test loss 3.275, len  test loss 0.042, col  test loss 144.895


Epoch 74: 272batch [00:19, 14.14batch/s, loss=1.51e+3]


epoch 74: avg train loss 1547.87, bar train loss 3.211, len train loss 0.040, col train loss 144.040


Epoch 75: 2batch [00:00, 14.08batch/s, loss=1.56e+3]

epoch 74: avg test  loss 1556.34, bar  test loss 3.310, len  test loss 0.042, col  test loss 144.768


Epoch 75: 272batch [00:19, 14.08batch/s, loss=1.62e+3]


epoch 75: avg train loss 1546.49, bar train loss 3.208, len train loss 0.038, col train loss 143.911
epoch 75: avg test  loss 1554.32, bar  test loss 3.218, len  test loss 0.039, col  test loss 144.728


Epoch 76: 272batch [00:19, 13.81batch/s, loss=1.56e+3]


epoch 76: avg train loss 1545.71, bar train loss 3.198, len train loss 0.039, col train loss 143.800


Epoch 77: 2batch [00:00, 14.08batch/s, loss=1.55e+3]

epoch 76: avg test  loss 1553.28, bar  test loss 3.248, len  test loss 0.038, col  test loss 144.371


Epoch 77: 272batch [00:19, 14.11batch/s, loss=1.58e+3]


epoch 77: avg train loss 1544.29, bar train loss 3.172, len train loss 0.038, col train loss 143.677


Epoch 78: 2batch [00:00, 14.39batch/s, loss=1.55e+3]

epoch 77: avg test  loss 1553.32, bar  test loss 3.300, len  test loss 0.038, col  test loss 144.549


Epoch 78: 272batch [00:19, 14.09batch/s, loss=1.51e+3]


epoch 78: avg train loss 1543.66, bar train loss 3.171, len train loss 0.039, col train loss 143.559


Epoch 79: 2batch [00:00, 14.29batch/s, loss=1.57e+3]

epoch 78: avg test  loss 1553.07, bar  test loss 3.274, len  test loss 0.038, col  test loss 144.283


Epoch 79: 272batch [00:19, 14.11batch/s, loss=1.46e+3]


epoch 79: avg train loss 1542.57, bar train loss 3.158, len train loss 0.038, col train loss 143.458


Epoch 80: 2batch [00:00, 13.79batch/s, loss=1.54e+3]

epoch 79: avg test  loss 1551.31, bar  test loss 3.221, len  test loss 0.037, col  test loss 144.233


Epoch 80: 272batch [00:19, 14.11batch/s, loss=1.5e+3] 


epoch 80: avg train loss 1541.62, bar train loss 3.155, len train loss 0.038, col train loss 143.371
epoch 80: avg test  loss 1550.59, bar  test loss 3.258, len  test loss 0.050, col  test loss 144.028


Epoch 81: 272batch [00:19, 14.10batch/s, loss=1.36e+3]


epoch 81: avg train loss 1540.48, bar train loss 3.132, len train loss 0.037, col train loss 143.247


Epoch 82: 2batch [00:00, 14.18batch/s, loss=1.6e+3]

epoch 81: avg test  loss 1549.35, bar  test loss 3.163, len  test loss 0.040, col  test loss 144.138


Epoch 82: 272batch [00:19, 14.13batch/s, loss=1.53e+3]


epoch 82: avg train loss 1539.67, bar train loss 3.130, len train loss 0.038, col train loss 143.125


Epoch 83: 2batch [00:00, 13.99batch/s, loss=1.56e+3]

epoch 82: avg test  loss 1547.75, bar  test loss 3.212, len  test loss 0.039, col  test loss 144.077


Epoch 83: 272batch [00:19, 13.89batch/s, loss=1.51e+3]


epoch 83: avg train loss 1538.40, bar train loss 3.113, len train loss 0.037, col train loss 143.026


Epoch 84: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 83: avg test  loss 1548.14, bar  test loss 3.192, len  test loss 0.040, col  test loss 144.072


Epoch 84: 272batch [00:20, 13.53batch/s, loss=1.32e+3]


epoch 84: avg train loss 1537.93, bar train loss 3.109, len train loss 0.038, col train loss 142.962


Epoch 85: 2batch [00:00, 13.99batch/s, loss=1.53e+3]

epoch 84: avg test  loss 1546.97, bar  test loss 3.213, len  test loss 0.039, col  test loss 143.810


Epoch 85: 272batch [00:19, 14.05batch/s, loss=1.54e+3]


epoch 85: avg train loss 1536.65, bar train loss 3.090, len train loss 0.037, col train loss 142.820
epoch 85: avg test  loss 1545.18, bar  test loss 3.120, len  test loss 0.037, col  test loss 143.323


Epoch 86: 272batch [00:19, 13.92batch/s, loss=1.55e+3]


epoch 86: avg train loss 1535.46, bar train loss 3.073, len train loss 0.036, col train loss 142.682


Epoch 87: 2batch [00:00, 13.70batch/s, loss=1.56e+3]

epoch 86: avg test  loss 1546.03, bar  test loss 3.121, len  test loss 0.040, col  test loss 143.773


Epoch 87: 272batch [00:19, 13.66batch/s, loss=1.58e+3]


epoch 87: avg train loss 1534.66, bar train loss 3.066, len train loss 0.036, col train loss 142.597


Epoch 88: 2batch [00:00, 14.08batch/s, loss=1.51e+3]

epoch 87: avg test  loss 1543.78, bar  test loss 3.139, len  test loss 0.039, col  test loss 143.537


Epoch 88: 272batch [00:19, 14.08batch/s, loss=1.53e+3]


epoch 88: avg train loss 1533.53, bar train loss 3.051, len train loss 0.036, col train loss 142.440


Epoch 89: 2batch [00:00, 14.08batch/s, loss=1.54e+3]

epoch 88: avg test  loss 1542.08, bar  test loss 3.116, len  test loss 0.039, col  test loss 143.264


Epoch 89: 272batch [00:19, 14.04batch/s, loss=1.64e+3]


epoch 89: avg train loss 1532.84, bar train loss 3.045, len train loss 0.036, col train loss 142.386


Epoch 90: 2batch [00:00, 14.08batch/s, loss=1.44e+3]

epoch 89: avg test  loss 1541.46, bar  test loss 3.099, len  test loss 0.039, col  test loss 143.105


Epoch 90: 272batch [00:19, 13.66batch/s, loss=1.59e+3]


epoch 90: avg train loss 1531.53, bar train loss 3.019, len train loss 0.036, col train loss 142.262
epoch 90: avg test  loss 1540.60, bar  test loss 3.091, len  test loss 0.035, col  test loss 143.048


Epoch 91: 272batch [00:19, 13.96batch/s, loss=1.57e+3]


epoch 91: avg train loss 1530.45, bar train loss 3.016, len train loss 0.036, col train loss 142.149


Epoch 92: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 91: avg test  loss 1540.16, bar  test loss 3.104, len  test loss 0.041, col  test loss 142.975


Epoch 92: 272batch [00:19, 13.97batch/s, loss=1.72e+3]


epoch 92: avg train loss 1529.70, bar train loss 2.999, len train loss 0.035, col train loss 142.060


Epoch 93: 2batch [00:00, 13.70batch/s, loss=1.5e+3]

epoch 92: avg test  loss 1539.96, bar  test loss 3.087, len  test loss 0.038, col  test loss 143.007


Epoch 93: 272batch [00:20, 13.58batch/s, loss=1.61e+3]


epoch 93: avg train loss 1529.07, bar train loss 2.993, len train loss 0.035, col train loss 142.002


Epoch 94: 2batch [00:00, 13.99batch/s, loss=1.56e+3]

epoch 93: avg test  loss 1537.84, bar  test loss 3.032, len  test loss 0.036, col  test loss 142.865


Epoch 94: 272batch [00:19, 13.82batch/s, loss=1.54e+3]


epoch 94: avg train loss 1527.90, bar train loss 2.986, len train loss 0.036, col train loss 141.846


Epoch 95: 2batch [00:00, 13.61batch/s, loss=1.45e+3]

epoch 94: avg test  loss 1539.03, bar  test loss 3.055, len  test loss 0.042, col  test loss 142.664


Epoch 95: 272batch [00:19, 13.83batch/s, loss=1.46e+3]


epoch 95: avg train loss 1527.11, bar train loss 2.990, len train loss 0.035, col train loss 141.761
epoch 95: avg test  loss 1537.75, bar  test loss 3.056, len  test loss 0.035, col  test loss 142.685


Epoch 96: 272batch [00:19, 13.99batch/s, loss=1.58e+3]


epoch 96: avg train loss 1525.85, bar train loss 2.973, len train loss 0.035, col train loss 141.645


Epoch 97: 2batch [00:00, 14.18batch/s, loss=1.45e+3]

epoch 96: avg test  loss 1536.20, bar  test loss 3.058, len  test loss 0.038, col  test loss 142.540


Epoch 97: 272batch [00:19, 13.92batch/s, loss=1.53e+3]


epoch 97: avg train loss 1525.12, bar train loss 2.959, len train loss 0.036, col train loss 141.522


Epoch 98: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 97: avg test  loss 1536.64, bar  test loss 3.012, len  test loss 0.036, col  test loss 142.689


Epoch 98: 272batch [00:19, 13.98batch/s, loss=1.55e+3]


epoch 98: avg train loss 1524.33, bar train loss 2.955, len train loss 0.035, col train loss 141.441


Epoch 99: 2batch [00:00, 14.29batch/s, loss=1.56e+3]

epoch 98: avg test  loss 1536.81, bar  test loss 3.071, len  test loss 0.036, col  test loss 142.548


Epoch 99: 272batch [00:19, 13.90batch/s, loss=1.42e+3]


epoch 99: avg train loss 1523.48, bar train loss 2.942, len train loss 0.035, col train loss 141.351


Epoch 100: 2batch [00:00, 14.18batch/s, loss=1.53e+3]

epoch 99: avg test  loss 1533.51, bar  test loss 3.051, len  test loss 0.036, col  test loss 142.354


Epoch 100: 272batch [00:19, 13.99batch/s, loss=1.45e+3]


epoch 100: avg train loss 1522.30, bar train loss 2.925, len train loss 0.034, col train loss 141.220
epoch 100: avg test  loss 1532.25, bar  test loss 3.002, len  test loss 0.034, col  test loss 141.901


Epoch 101: 272batch [00:19, 13.93batch/s, loss=1.38e+3]


epoch 101: avg train loss 1521.18, bar train loss 2.917, len train loss 0.034, col train loss 141.109


Epoch 102: 2batch [00:00, 13.70batch/s, loss=1.47e+3]

epoch 101: avg test  loss 1532.08, bar  test loss 3.010, len  test loss 0.037, col  test loss 142.199


Epoch 102: 272batch [00:19, 13.98batch/s, loss=1.59e+3]


epoch 102: avg train loss 1520.27, bar train loss 2.911, len train loss 0.034, col train loss 141.008


Epoch 103: 2batch [00:00, 14.29batch/s, loss=1.46e+3]

epoch 102: avg test  loss 1531.48, bar  test loss 2.990, len  test loss 0.035, col  test loss 142.006


Epoch 103: 272batch [00:19, 13.96batch/s, loss=1.55e+3]


epoch 103: avg train loss 1519.23, bar train loss 2.896, len train loss 0.033, col train loss 140.901


Epoch 104: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 103: avg test  loss 1530.73, bar  test loss 3.000, len  test loss 0.035, col  test loss 142.191


Epoch 104: 272batch [00:19, 13.73batch/s, loss=1.46e+3]


epoch 104: avg train loss 1518.33, bar train loss 2.896, len train loss 0.034, col train loss 140.782


Epoch 105: 2batch [00:00, 13.61batch/s, loss=1.51e+3]

epoch 104: avg test  loss 1531.96, bar  test loss 3.135, len  test loss 0.037, col  test loss 141.949


Epoch 105: 272batch [00:20, 13.37batch/s, loss=1.51e+3]


epoch 105: avg train loss 1517.89, bar train loss 2.891, len train loss 0.034, col train loss 140.729
epoch 105: avg test  loss 1529.39, bar  test loss 2.940, len  test loss 0.034, col  test loss 141.778


Epoch 106: 272batch [00:19, 13.79batch/s, loss=1.45e+3]


epoch 106: avg train loss 1516.96, bar train loss 2.883, len train loss 0.034, col train loss 140.608


Epoch 107: 2batch [00:00, 13.89batch/s, loss=1.51e+3]

epoch 106: avg test  loss 1528.36, bar  test loss 2.999, len  test loss 0.036, col  test loss 141.638


Epoch 107: 272batch [00:19, 13.96batch/s, loss=1.51e+3]


epoch 107: avg train loss 1516.03, bar train loss 2.877, len train loss 0.033, col train loss 140.500


Epoch 108: 2batch [00:00, 13.61batch/s, loss=1.52e+3]

epoch 107: avg test  loss 1528.06, bar  test loss 2.963, len  test loss 0.049, col  test loss 141.600


Epoch 108: 272batch [00:19, 13.97batch/s, loss=1.53e+3]


epoch 108: avg train loss 1515.32, bar train loss 2.870, len train loss 0.034, col train loss 140.387


Epoch 109: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 108: avg test  loss 1526.86, bar  test loss 2.927, len  test loss 0.037, col  test loss 141.425


Epoch 109: 272batch [00:19, 13.97batch/s, loss=1.53e+3]


epoch 109: avg train loss 1514.72, bar train loss 2.863, len train loss 0.033, col train loss 140.322


Epoch 110: 2batch [00:00, 13.99batch/s, loss=1.48e+3]

epoch 109: avg test  loss 1527.58, bar  test loss 2.970, len  test loss 0.053, col  test loss 141.108


Epoch 110: 272batch [00:19, 13.74batch/s, loss=1.61e+3]


epoch 110: avg train loss 1513.43, bar train loss 2.849, len train loss 0.034, col train loss 140.156
epoch 110: avg test  loss 1525.47, bar  test loss 2.933, len  test loss 0.041, col  test loss 141.035


Epoch 111: 272batch [00:20, 13.58batch/s, loss=1.49e+3]


epoch 111: avg train loss 1512.36, bar train loss 2.853, len train loss 0.033, col train loss 140.018


Epoch 112: 2batch [00:00, 14.08batch/s, loss=1.6e+3]

epoch 111: avg test  loss 1524.57, bar  test loss 2.910, len  test loss 0.034, col  test loss 141.467


Epoch 112: 272batch [00:19, 14.03batch/s, loss=1.54e+3]


epoch 112: avg train loss 1511.58, bar train loss 2.844, len train loss 0.033, col train loss 139.950


Epoch 113: 2batch [00:00, 13.51batch/s, loss=1.46e+3]

epoch 112: avg test  loss 1523.54, bar  test loss 3.003, len  test loss 0.034, col  test loss 140.998


Epoch 113: 272batch [00:19, 14.01batch/s, loss=1.44e+3]


epoch 113: avg train loss 1510.88, bar train loss 2.841, len train loss 0.033, col train loss 139.841


Epoch 114: 2batch [00:00, 13.99batch/s, loss=1.47e+3]

epoch 113: avg test  loss 1522.32, bar  test loss 2.916, len  test loss 0.035, col  test loss 141.059


Epoch 114: 272batch [00:19, 13.98batch/s, loss=1.63e+3]


epoch 114: avg train loss 1510.10, bar train loss 2.824, len train loss 0.033, col train loss 139.731


Epoch 115: 2batch [00:00, 13.33batch/s, loss=1.51e+3]

epoch 114: avg test  loss 1521.53, bar  test loss 2.946, len  test loss 0.033, col  test loss 141.057


Epoch 115: 272batch [00:19, 13.82batch/s, loss=1.55e+3]


epoch 115: avg train loss 1508.85, bar train loss 2.815, len train loss 0.032, col train loss 139.623
epoch 115: avg test  loss 1522.31, bar  test loss 3.002, len  test loss 0.033, col  test loss 140.829


Epoch 116: 272batch [00:19, 14.30batch/s, loss=1.56e+3]


epoch 116: avg train loss 1508.31, bar train loss 2.814, len train loss 0.032, col train loss 139.546


Epoch 117: 2batch [00:00, 14.08batch/s, loss=1.51e+3]

epoch 116: avg test  loss 1520.10, bar  test loss 2.914, len  test loss 0.035, col  test loss 140.662


Epoch 117: 272batch [00:18, 14.36batch/s, loss=1.47e+3]


epoch 117: avg train loss 1507.47, bar train loss 2.807, len train loss 0.032, col train loss 139.426


Epoch 118: 2batch [00:00, 14.29batch/s, loss=1.51e+3]

epoch 117: avg test  loss 1521.94, bar  test loss 2.904, len  test loss 0.035, col  test loss 140.739


Epoch 118: 272batch [00:18, 14.38batch/s, loss=1.45e+3]


epoch 118: avg train loss 1506.43, bar train loss 2.806, len train loss 0.032, col train loss 139.295


Epoch 119: 2batch [00:00, 14.60batch/s, loss=1.54e+3]

epoch 118: avg test  loss 1518.77, bar  test loss 2.853, len  test loss 0.034, col  test loss 140.315


Epoch 119: 272batch [00:18, 14.34batch/s, loss=1.6e+3] 


epoch 119: avg train loss 1505.25, bar train loss 2.795, len train loss 0.033, col train loss 139.182


Epoch 120: 2batch [00:00, 14.29batch/s, loss=1.47e+3]

epoch 119: avg test  loss 1517.97, bar  test loss 2.878, len  test loss 0.041, col  test loss 140.309


Epoch 120: 272batch [00:18, 14.35batch/s, loss=1.52e+3]


epoch 120: avg train loss 1504.79, bar train loss 2.784, len train loss 0.032, col train loss 139.120
epoch 120: avg test  loss 1517.31, bar  test loss 2.907, len  test loss 0.035, col  test loss 140.292


Epoch 121: 272batch [00:19, 13.84batch/s, loss=1.54e+3]


epoch 121: avg train loss 1504.21, bar train loss 2.786, len train loss 0.032, col train loss 139.023


Epoch 122: 2batch [00:00, 13.70batch/s, loss=1.49e+3]

epoch 121: avg test  loss 1516.80, bar  test loss 2.883, len  test loss 0.034, col  test loss 140.057


Epoch 122: 272batch [00:19, 13.76batch/s, loss=1.38e+3]


epoch 122: avg train loss 1503.06, bar train loss 2.775, len train loss 0.033, col train loss 138.893


Epoch 123: 2batch [00:00, 13.99batch/s, loss=1.53e+3]

epoch 122: avg test  loss 1516.48, bar  test loss 2.847, len  test loss 0.035, col  test loss 140.238


Epoch 123: 272batch [00:19, 13.76batch/s, loss=1.48e+3]


epoch 123: avg train loss 1501.92, bar train loss 2.767, len train loss 0.031, col train loss 138.746


Epoch 124: 2batch [00:00, 13.42batch/s, loss=1.54e+3]

epoch 123: avg test  loss 1514.20, bar  test loss 2.858, len  test loss 0.034, col  test loss 139.880


Epoch 124: 272batch [00:19, 13.66batch/s, loss=1.48e+3]


epoch 124: avg train loss 1501.82, bar train loss 2.771, len train loss 0.032, col train loss 138.716


Epoch 125: 2batch [00:00, 14.49batch/s, loss=1.51e+3]

epoch 124: avg test  loss 1514.92, bar  test loss 2.981, len  test loss 0.033, col  test loss 140.001


Epoch 125: 272batch [00:19, 13.98batch/s, loss=1.42e+3]


epoch 125: avg train loss 1500.62, bar train loss 2.766, len train loss 0.031, col train loss 138.583
epoch 125: avg test  loss 1515.32, bar  test loss 2.891, len  test loss 0.036, col  test loss 139.853


Epoch 126: 272batch [00:19, 13.99batch/s, loss=1.55e+3]


epoch 126: avg train loss 1500.20, bar train loss 2.750, len train loss 0.033, col train loss 138.487


Epoch 127: 2batch [00:00, 14.29batch/s, loss=1.55e+3]

epoch 126: avg test  loss 1511.99, bar  test loss 2.825, len  test loss 0.033, col  test loss 139.704


Epoch 127: 272batch [00:18, 14.32batch/s, loss=1.66e+3]


epoch 127: avg train loss 1499.37, bar train loss 2.757, len train loss 0.032, col train loss 138.410


Epoch 128: 2batch [00:00, 14.60batch/s, loss=1.42e+3]

epoch 127: avg test  loss 1513.08, bar  test loss 2.875, len  test loss 0.036, col  test loss 139.684


Epoch 128: 272batch [00:19, 14.30batch/s, loss=1.58e+3]


epoch 128: avg train loss 1498.90, bar train loss 2.746, len train loss 0.032, col train loss 138.356


Epoch 129: 2batch [00:00, 14.49batch/s, loss=1.48e+3]

epoch 128: avg test  loss 1514.16, bar  test loss 2.898, len  test loss 0.033, col  test loss 139.653


Epoch 129: 272batch [00:19, 14.23batch/s, loss=1.37e+3]


epoch 129: avg train loss 1497.91, bar train loss 2.740, len train loss 0.031, col train loss 138.214


Epoch 130: 2batch [00:00, 13.99batch/s, loss=1.53e+3]

epoch 129: avg test  loss 1510.73, bar  test loss 2.808, len  test loss 0.033, col  test loss 139.336


Epoch 130: 272batch [00:19, 14.15batch/s, loss=1.48e+3]


epoch 130: avg train loss 1497.00, bar train loss 2.733, len train loss 0.032, col train loss 138.118
epoch 130: avg test  loss 1510.60, bar  test loss 2.850, len  test loss 0.032, col  test loss 139.567


Epoch 131: 272batch [00:19, 14.14batch/s, loss=1.53e+3]


epoch 131: avg train loss 1495.85, bar train loss 2.728, len train loss 0.031, col train loss 137.983


Epoch 132: 2batch [00:00, 13.99batch/s, loss=1.49e+3]

epoch 131: avg test  loss 1511.38, bar  test loss 2.824, len  test loss 0.033, col  test loss 139.387


Epoch 132: 272batch [00:19, 14.12batch/s, loss=1.5e+3] 


epoch 132: avg train loss 1495.31, bar train loss 2.718, len train loss 0.031, col train loss 137.884


Epoch 133: 2batch [00:00, 13.33batch/s, loss=1.51e+3]

epoch 132: avg test  loss 1509.12, bar  test loss 2.784, len  test loss 0.031, col  test loss 139.290


Epoch 133: 272batch [00:20, 13.35batch/s, loss=1.43e+3]


epoch 133: avg train loss 1494.70, bar train loss 2.717, len train loss 0.032, col train loss 137.807


Epoch 134: 2batch [00:00, 14.08batch/s, loss=1.45e+3]

epoch 133: avg test  loss 1510.21, bar  test loss 2.791, len  test loss 0.038, col  test loss 138.891


Epoch 134: 272batch [00:20, 13.55batch/s, loss=1.53e+3]


epoch 134: avg train loss 1494.05, bar train loss 2.716, len train loss 0.032, col train loss 137.721


Epoch 135: 2batch [00:00, 14.39batch/s, loss=1.47e+3]

epoch 134: avg test  loss 1508.70, bar  test loss 2.788, len  test loss 0.035, col  test loss 139.016


Epoch 135: 272batch [00:19, 13.82batch/s, loss=1.52e+3]


epoch 135: avg train loss 1492.91, bar train loss 2.706, len train loss 0.031, col train loss 137.617
epoch 135: avg test  loss 1507.12, bar  test loss 2.827, len  test loss 0.032, col  test loss 138.944


Epoch 136: 272batch [00:20, 13.39batch/s, loss=1.45e+3]


epoch 136: avg train loss 1492.38, bar train loss 2.691, len train loss 0.031, col train loss 137.517


Epoch 137: 2batch [00:00, 14.08batch/s, loss=1.5e+3]

epoch 136: avg test  loss 1506.11, bar  test loss 2.778, len  test loss 0.033, col  test loss 139.013


Epoch 137: 272batch [00:19, 14.12batch/s, loss=1.38e+3]


epoch 137: avg train loss 1491.62, bar train loss 2.695, len train loss 0.031, col train loss 137.403


Epoch 138: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 137: avg test  loss 1508.29, bar  test loss 2.829, len  test loss 0.046, col  test loss 138.920


Epoch 138: 272batch [00:19, 14.16batch/s, loss=1.57e+3]


epoch 138: avg train loss 1490.83, bar train loss 2.690, len train loss 0.032, col train loss 137.344


Epoch 139: 2batch [00:00, 14.39batch/s, loss=1.5e+3]

epoch 138: avg test  loss 1505.37, bar  test loss 2.757, len  test loss 0.033, col  test loss 138.642


Epoch 139: 272batch [00:19, 14.24batch/s, loss=1.59e+3]


epoch 139: avg train loss 1489.66, bar train loss 2.688, len train loss 0.031, col train loss 137.159


Epoch 140: 2batch [00:00, 14.29batch/s, loss=1.5e+3]

epoch 139: avg test  loss 1504.17, bar  test loss 2.751, len  test loss 0.032, col  test loss 138.593


Epoch 140: 272batch [00:19, 14.11batch/s, loss=1.48e+3]


epoch 140: avg train loss 1489.12, bar train loss 2.682, len train loss 0.031, col train loss 137.108
epoch 140: avg test  loss 1504.87, bar  test loss 2.791, len  test loss 0.032, col  test loss 138.585


Epoch 141: 272batch [00:19, 14.09batch/s, loss=1.61e+3]


epoch 141: avg train loss 1488.40, bar train loss 2.675, len train loss 0.031, col train loss 137.042


Epoch 142: 2batch [00:00, 14.08batch/s, loss=1.43e+3]

epoch 141: avg test  loss 1503.92, bar  test loss 2.783, len  test loss 0.033, col  test loss 138.577


Epoch 142: 272batch [00:19, 14.10batch/s, loss=1.6e+3] 


epoch 142: avg train loss 1487.72, bar train loss 2.676, len train loss 0.032, col train loss 136.902


Epoch 143: 2batch [00:00, 14.18batch/s, loss=1.43e+3]

epoch 142: avg test  loss 1502.66, bar  test loss 2.751, len  test loss 0.034, col  test loss 138.348


Epoch 143: 272batch [00:19, 14.13batch/s, loss=1.41e+3]


epoch 143: avg train loss 1486.74, bar train loss 2.670, len train loss 0.030, col train loss 136.808


Epoch 144: 2batch [00:00, 14.08batch/s, loss=1.52e+3]

epoch 143: avg test  loss 1503.15, bar  test loss 2.836, len  test loss 0.032, col  test loss 138.518


Epoch 144: 272batch [00:19, 13.72batch/s, loss=1.55e+3]


epoch 144: avg train loss 1486.24, bar train loss 2.661, len train loss 0.032, col train loss 136.731


Epoch 145: 2batch [00:00, 13.79batch/s, loss=1.52e+3]

epoch 144: avg test  loss 1501.14, bar  test loss 2.745, len  test loss 0.035, col  test loss 138.072


Epoch 145: 272batch [00:19, 13.63batch/s, loss=1.56e+3]


epoch 145: avg train loss 1485.36, bar train loss 2.661, len train loss 0.031, col train loss 136.579
epoch 145: avg test  loss 1501.64, bar  test loss 2.749, len  test loss 0.032, col  test loss 138.140


Epoch 146: 272batch [00:19, 13.74batch/s, loss=1.48e+3]


epoch 146: avg train loss 1484.28, bar train loss 2.657, len train loss 0.031, col train loss 136.453


Epoch 147: 2batch [00:00, 13.79batch/s, loss=1.41e+3]

epoch 146: avg test  loss 1499.87, bar  test loss 2.769, len  test loss 0.032, col  test loss 138.202


Epoch 147: 272batch [00:19, 13.82batch/s, loss=1.62e+3]


epoch 147: avg train loss 1483.66, bar train loss 2.663, len train loss 0.031, col train loss 136.371


Epoch 148: 2batch [00:00, 13.79batch/s, loss=1.46e+3]

epoch 147: avg test  loss 1498.24, bar  test loss 2.758, len  test loss 0.031, col  test loss 137.471


Epoch 148: 272batch [00:19, 13.81batch/s, loss=1.35e+3]


epoch 148: avg train loss 1482.50, bar train loss 2.652, len train loss 0.030, col train loss 136.223


Epoch 149: 2batch [00:00, 13.79batch/s, loss=1.52e+3]

epoch 148: avg test  loss 1501.77, bar  test loss 2.772, len  test loss 0.033, col  test loss 138.245


Epoch 149: 272batch [00:19, 13.81batch/s, loss=1.5e+3] 


epoch 149: avg train loss 1481.89, bar train loss 2.647, len train loss 0.030, col train loss 136.147


Epoch 150: 2batch [00:00, 13.89batch/s, loss=1.49e+3]

epoch 149: avg test  loss 1498.71, bar  test loss 2.778, len  test loss 0.032, col  test loss 137.732


Epoch 150: 272batch [00:19, 13.78batch/s, loss=1.35e+3]


epoch 150: avg train loss 1480.84, bar train loss 2.654, len train loss 0.031, col train loss 135.989
epoch 150: avg test  loss 1497.34, bar  test loss 2.774, len  test loss 0.033, col  test loss 137.631


Epoch 151: 272batch [00:19, 13.67batch/s, loss=1.58e+3]


epoch 151: avg train loss 1479.97, bar train loss 2.650, len train loss 0.030, col train loss 135.886


Epoch 152: 2batch [00:00, 13.42batch/s, loss=1.48e+3]

epoch 151: avg test  loss 1495.20, bar  test loss 2.755, len  test loss 0.033, col  test loss 137.279


Epoch 152: 272batch [00:19, 13.87batch/s, loss=1.62e+3]


epoch 152: avg train loss 1479.24, bar train loss 2.641, len train loss 0.030, col train loss 135.785


Epoch 153: 2batch [00:00, 14.08batch/s, loss=1.46e+3]

epoch 152: avg test  loss 1496.91, bar  test loss 2.831, len  test loss 0.033, col  test loss 137.430


Epoch 153: 272batch [00:19, 14.04batch/s, loss=1.45e+3]


epoch 153: avg train loss 1478.02, bar train loss 2.647, len train loss 0.031, col train loss 135.607


Epoch 154: 2batch [00:00, 12.90batch/s, loss=1.5e+3]

epoch 153: avg test  loss 1494.95, bar  test loss 2.704, len  test loss 0.032, col  test loss 137.212


Epoch 154: 272batch [00:20, 13.54batch/s, loss=1.53e+3]


epoch 154: avg train loss 1477.32, bar train loss 2.627, len train loss 0.030, col train loss 135.538


Epoch 155: 2batch [00:00, 13.89batch/s, loss=1.49e+3]

epoch 154: avg test  loss 1492.12, bar  test loss 2.760, len  test loss 0.032, col  test loss 137.007


Epoch 155: 272batch [00:19, 13.70batch/s, loss=1.52e+3]


epoch 155: avg train loss 1476.26, bar train loss 2.632, len train loss 0.031, col train loss 135.395
epoch 155: avg test  loss 1491.74, bar  test loss 2.753, len  test loss 0.033, col  test loss 136.883


Epoch 156: 272batch [00:20, 13.59batch/s, loss=1.49e+3]


epoch 156: avg train loss 1475.27, bar train loss 2.627, len train loss 0.030, col train loss 135.254


Epoch 157: 2batch [00:00, 13.70batch/s, loss=1.5e+3]

epoch 156: avg test  loss 1495.21, bar  test loss 2.706, len  test loss 0.037, col  test loss 137.211


Epoch 157: 272batch [00:19, 13.74batch/s, loss=1.39e+3]


epoch 157: avg train loss 1474.41, bar train loss 2.622, len train loss 0.030, col train loss 135.155


Epoch 158: 2batch [00:00, 13.89batch/s, loss=1.48e+3]

epoch 157: avg test  loss 1492.61, bar  test loss 2.906, len  test loss 0.031, col  test loss 136.837


Epoch 158: 272batch [00:19, 13.73batch/s, loss=1.53e+3]


epoch 158: avg train loss 1474.16, bar train loss 2.634, len train loss 0.030, col train loss 135.083


Epoch 159: 2batch [00:00, 13.89batch/s, loss=1.47e+3]

epoch 158: avg test  loss 1489.64, bar  test loss 2.725, len  test loss 0.032, col  test loss 136.718


Epoch 159: 272batch [00:19, 13.72batch/s, loss=1.31e+3]


epoch 159: avg train loss 1473.02, bar train loss 2.626, len train loss 0.030, col train loss 134.956


Epoch 160: 2batch [00:00, 13.89batch/s, loss=1.39e+3]

epoch 159: avg test  loss 1489.64, bar  test loss 2.772, len  test loss 0.032, col  test loss 136.698


Epoch 160: 272batch [00:19, 13.69batch/s, loss=1.56e+3]


epoch 160: avg train loss 1472.02, bar train loss 2.610, len train loss 0.031, col train loss 134.830
epoch 160: avg test  loss 1488.97, bar  test loss 2.746, len  test loss 0.030, col  test loss 136.521


Epoch 161: 272batch [00:20, 13.54batch/s, loss=1.55e+3]


epoch 161: avg train loss 1471.16, bar train loss 2.622, len train loss 0.029, col train loss 134.711


Epoch 162: 2batch [00:00, 13.89batch/s, loss=1.46e+3]

epoch 161: avg test  loss 1488.31, bar  test loss 2.681, len  test loss 0.032, col  test loss 136.311


Epoch 162: 272batch [00:19, 13.67batch/s, loss=1.41e+3]


epoch 162: avg train loss 1470.40, bar train loss 2.610, len train loss 0.030, col train loss 134.612


Epoch 163: 2batch [00:00, 13.70batch/s, loss=1.4e+3]

epoch 162: avg test  loss 1488.47, bar  test loss 2.689, len  test loss 0.031, col  test loss 136.429


Epoch 163: 272batch [00:19, 13.64batch/s, loss=1.42e+3]


epoch 163: avg train loss 1469.80, bar train loss 2.611, len train loss 0.030, col train loss 134.539


Epoch 164: 2batch [00:00, 13.61batch/s, loss=1.43e+3]

epoch 163: avg test  loss 1487.22, bar  test loss 2.707, len  test loss 0.032, col  test loss 136.224


Epoch 164: 272batch [00:19, 13.68batch/s, loss=1.5e+3] 


epoch 164: avg train loss 1469.29, bar train loss 2.609, len train loss 0.030, col train loss 134.465


Epoch 165: 2batch [00:00, 13.89batch/s, loss=1.48e+3]

epoch 164: avg test  loss 1484.82, bar  test loss 2.713, len  test loss 0.033, col  test loss 136.094


Epoch 165: 272batch [00:20, 13.44batch/s, loss=1.6e+3] 


epoch 165: avg train loss 1468.66, bar train loss 2.605, len train loss 0.030, col train loss 134.377
epoch 165: avg test  loss 1486.45, bar  test loss 2.718, len  test loss 0.039, col  test loss 136.346


Epoch 166: 272batch [00:20, 13.43batch/s, loss=1.43e+3]


epoch 166: avg train loss 1467.45, bar train loss 2.599, len train loss 0.030, col train loss 134.222


Epoch 167: 2batch [00:00, 14.18batch/s, loss=1.48e+3]

epoch 166: avg test  loss 1484.56, bar  test loss 2.680, len  test loss 0.031, col  test loss 135.671


Epoch 167: 272batch [00:19, 13.71batch/s, loss=1.49e+3]


epoch 167: avg train loss 1466.78, bar train loss 2.599, len train loss 0.030, col train loss 134.143


Epoch 168: 2batch [00:00, 13.89batch/s, loss=1.51e+3]

epoch 167: avg test  loss 1484.32, bar  test loss 2.715, len  test loss 0.031, col  test loss 135.593


Epoch 168: 272batch [00:19, 13.64batch/s, loss=1.43e+3]


epoch 168: avg train loss 1466.21, bar train loss 2.593, len train loss 0.029, col train loss 134.028


Epoch 169: 2batch [00:00, 13.79batch/s, loss=1.5e+3]

epoch 168: avg test  loss 1483.84, bar  test loss 2.704, len  test loss 0.031, col  test loss 135.556


Epoch 169: 272batch [00:19, 13.69batch/s, loss=1.45e+3]


epoch 169: avg train loss 1465.37, bar train loss 2.595, len train loss 0.030, col train loss 133.939


Epoch 170: 2batch [00:00, 13.61batch/s, loss=1.48e+3]

epoch 169: avg test  loss 1482.69, bar  test loss 2.761, len  test loss 0.031, col  test loss 135.592


Epoch 170: 272batch [00:19, 13.63batch/s, loss=1.42e+3]


epoch 170: avg train loss 1464.42, bar train loss 2.592, len train loss 0.030, col train loss 133.823
epoch 170: avg test  loss 1482.41, bar  test loss 2.690, len  test loss 0.032, col  test loss 135.523


Epoch 171: 272batch [00:20, 13.49batch/s, loss=1.57e+3]


epoch 171: avg train loss 1463.52, bar train loss 2.575, len train loss 0.029, col train loss 133.730


Epoch 172: 2batch [00:00, 13.51batch/s, loss=1.5e+3]

epoch 171: avg test  loss 1481.42, bar  test loss 2.769, len  test loss 0.032, col  test loss 135.662


Epoch 172: 272batch [00:19, 13.62batch/s, loss=1.46e+3]


epoch 172: avg train loss 1463.48, bar train loss 2.583, len train loss 0.029, col train loss 133.712


Epoch 173: 2batch [00:00, 13.25batch/s, loss=1.46e+3]

epoch 172: avg test  loss 1482.78, bar  test loss 2.729, len  test loss 0.031, col  test loss 135.693


Epoch 173: 272batch [00:19, 13.64batch/s, loss=1.46e+3]


epoch 173: avg train loss 1462.84, bar train loss 2.588, len train loss 0.030, col train loss 133.601


Epoch 174: 2batch [00:00, 13.61batch/s, loss=1.47e+3]

epoch 173: avg test  loss 1480.45, bar  test loss 2.718, len  test loss 0.036, col  test loss 135.294


Epoch 174: 272batch [00:20, 13.58batch/s, loss=1.58e+3]


epoch 174: avg train loss 1462.18, bar train loss 2.577, len train loss 0.029, col train loss 133.518


Epoch 175: 2batch [00:00, 13.51batch/s, loss=1.45e+3]

epoch 174: avg test  loss 1479.84, bar  test loss 2.666, len  test loss 0.030, col  test loss 135.239


Epoch 175: 272batch [00:20, 13.52batch/s, loss=1.46e+3]


epoch 175: avg train loss 1461.43, bar train loss 2.566, len train loss 0.030, col train loss 133.433
epoch 175: avg test  loss 1480.12, bar  test loss 2.710, len  test loss 0.031, col  test loss 135.257


Epoch 176: 272batch [00:20, 13.24batch/s, loss=1.54e+3]


epoch 176: avg train loss 1460.94, bar train loss 2.570, len train loss 0.029, col train loss 133.329


Epoch 177: 2batch [00:00, 13.51batch/s, loss=1.43e+3]

epoch 176: avg test  loss 1480.00, bar  test loss 2.727, len  test loss 0.030, col  test loss 135.152


Epoch 177: 272batch [00:20, 13.35batch/s, loss=1.53e+3]


epoch 177: avg train loss 1460.18, bar train loss 2.566, len train loss 0.029, col train loss 133.261


Epoch 178: 2batch [00:00, 13.24batch/s, loss=1.44e+3]

epoch 177: avg test  loss 1477.72, bar  test loss 2.644, len  test loss 0.030, col  test loss 134.683


Epoch 178: 272batch [00:20, 13.54batch/s, loss=1.52e+3]


epoch 178: avg train loss 1459.54, bar train loss 2.552, len train loss 0.030, col train loss 133.172


Epoch 179: 2batch [00:00, 13.25batch/s, loss=1.42e+3]

epoch 178: avg test  loss 1477.66, bar  test loss 2.685, len  test loss 0.034, col  test loss 135.105


Epoch 179: 272batch [00:20, 13.60batch/s, loss=1.54e+3]


epoch 179: avg train loss 1458.56, bar train loss 2.546, len train loss 0.029, col train loss 133.071


Epoch 180: 2batch [00:00, 14.08batch/s, loss=1.45e+3]

epoch 179: avg test  loss 1478.04, bar  test loss 2.663, len  test loss 0.033, col  test loss 134.969


Epoch 180: 272batch [00:20, 13.47batch/s, loss=1.51e+3]


epoch 180: avg train loss 1458.23, bar train loss 2.547, len train loss 0.029, col train loss 133.018
epoch 180: avg test  loss 1478.45, bar  test loss 2.746, len  test loss 0.038, col  test loss 135.001


Epoch 181: 272batch [00:20, 13.39batch/s, loss=1.43e+3]


epoch 181: avg train loss 1457.86, bar train loss 2.549, len train loss 0.029, col train loss 132.957


Epoch 182: 2batch [00:00, 13.16batch/s, loss=1.54e+3]

epoch 181: avg test  loss 1476.78, bar  test loss 2.664, len  test loss 0.034, col  test loss 134.653


Epoch 182: 272batch [00:20, 13.35batch/s, loss=1.33e+3]


epoch 182: avg train loss 1456.81, bar train loss 2.551, len train loss 0.029, col train loss 132.835


Epoch 183: 2batch [00:00, 13.70batch/s, loss=1.5e+3]

epoch 182: avg test  loss 1475.93, bar  test loss 2.617, len  test loss 0.032, col  test loss 134.746


Epoch 183: 272batch [00:19, 13.62batch/s, loss=1.58e+3]


epoch 183: avg train loss 1456.51, bar train loss 2.550, len train loss 0.029, col train loss 132.784


Epoch 184: 2batch [00:00, 13.51batch/s, loss=1.48e+3]

epoch 183: avg test  loss 1475.55, bar  test loss 2.677, len  test loss 0.030, col  test loss 134.484


Epoch 184: 272batch [00:20, 13.57batch/s, loss=1.55e+3]


epoch 184: avg train loss 1456.28, bar train loss 2.551, len train loss 0.029, col train loss 132.744


Epoch 185: 2batch [00:00, 13.25batch/s, loss=1.46e+3]

epoch 184: avg test  loss 1474.96, bar  test loss 2.706, len  test loss 0.036, col  test loss 134.601


Epoch 185: 272batch [00:20, 13.57batch/s, loss=1.37e+3]


epoch 185: avg train loss 1455.14, bar train loss 2.537, len train loss 0.029, col train loss 132.633
epoch 185: avg test  loss 1474.91, bar  test loss 2.640, len  test loss 0.030, col  test loss 134.550


Epoch 186: 272batch [00:20, 13.39batch/s, loss=1.5e+3] 


epoch 186: avg train loss 1455.21, bar train loss 2.537, len train loss 0.029, col train loss 132.593


Epoch 187: 2batch [00:00, 13.70batch/s, loss=1.49e+3]

epoch 186: avg test  loss 1475.70, bar  test loss 2.668, len  test loss 0.032, col  test loss 134.562


Epoch 187: 272batch [00:20, 13.38batch/s, loss=1.5e+3] 


epoch 187: avg train loss 1454.79, bar train loss 2.533, len train loss 0.028, col train loss 132.568


Epoch 188: 2batch [00:00, 13.42batch/s, loss=1.49e+3]

epoch 187: avg test  loss 1474.33, bar  test loss 2.644, len  test loss 0.034, col  test loss 134.222


Epoch 188: 272batch [00:20, 13.39batch/s, loss=1.62e+3]


epoch 188: avg train loss 1454.05, bar train loss 2.535, len train loss 0.029, col train loss 132.438


Epoch 189: 2batch [00:00, 13.99batch/s, loss=1.44e+3]

epoch 188: avg test  loss 1471.29, bar  test loss 2.640, len  test loss 0.030, col  test loss 134.172


Epoch 189: 272batch [00:20, 13.53batch/s, loss=1.27e+3]


epoch 189: avg train loss 1453.43, bar train loss 2.521, len train loss 0.029, col train loss 132.383


Epoch 190: 2batch [00:00, 13.89batch/s, loss=1.44e+3]

epoch 189: avg test  loss 1473.09, bar  test loss 2.752, len  test loss 0.031, col  test loss 134.420


Epoch 190: 272batch [00:20, 13.53batch/s, loss=1.47e+3]


epoch 190: avg train loss 1452.68, bar train loss 2.535, len train loss 0.028, col train loss 132.274
epoch 190: avg test  loss 1472.22, bar  test loss 2.633, len  test loss 0.032, col  test loss 134.362


Epoch 191: 272batch [00:20, 13.34batch/s, loss=1.37e+3]


epoch 191: avg train loss 1452.54, bar train loss 2.521, len train loss 0.029, col train loss 132.261


Epoch 192: 2batch [00:00, 13.42batch/s, loss=1.45e+3]

epoch 191: avg test  loss 1472.07, bar  test loss 2.580, len  test loss 0.030, col  test loss 133.989


Epoch 192: 272batch [00:20, 13.48batch/s, loss=1.48e+3]


epoch 192: avg train loss 1451.74, bar train loss 2.521, len train loss 0.028, col train loss 132.187


Epoch 193: 2batch [00:00, 13.70batch/s, loss=1.48e+3]

epoch 192: avg test  loss 1471.97, bar  test loss 2.680, len  test loss 0.035, col  test loss 134.131


Epoch 193: 272batch [00:20, 13.52batch/s, loss=1.47e+3]


epoch 193: avg train loss 1451.09, bar train loss 2.514, len train loss 0.028, col train loss 132.070


Epoch 194: 2batch [00:00, 13.70batch/s, loss=1.51e+3]

epoch 193: avg test  loss 1469.77, bar  test loss 2.601, len  test loss 0.030, col  test loss 133.920


Epoch 194: 272batch [00:20, 13.50batch/s, loss=1.49e+3]


epoch 194: avg train loss 1450.88, bar train loss 2.513, len train loss 0.029, col train loss 132.029


Epoch 195: 2batch [00:00, 13.61batch/s, loss=1.53e+3]

epoch 194: avg test  loss 1471.12, bar  test loss 2.645, len  test loss 0.029, col  test loss 134.107


Epoch 195: 272batch [00:20, 13.42batch/s, loss=1.51e+3]


epoch 195: avg train loss 1449.81, bar train loss 2.506, len train loss 0.028, col train loss 131.932
epoch 195: avg test  loss 1472.38, bar  test loss 2.654, len  test loss 0.034, col  test loss 134.013


Epoch 196: 272batch [00:20, 13.34batch/s, loss=1.5e+3] 


epoch 196: avg train loss 1449.70, bar train loss 2.505, len train loss 0.029, col train loss 131.914


Epoch 197: 2batch [00:00, 13.79batch/s, loss=1.45e+3]

epoch 196: avg test  loss 1470.39, bar  test loss 2.606, len  test loss 0.030, col  test loss 133.958


Epoch 197: 272batch [00:20, 13.49batch/s, loss=1.34e+3]


epoch 197: avg train loss 1449.18, bar train loss 2.504, len train loss 0.029, col train loss 131.832


Epoch 198: 2batch [00:00, 12.74batch/s, loss=1.49e+3]

epoch 197: avg test  loss 1469.67, bar  test loss 2.652, len  test loss 0.030, col  test loss 134.157


Epoch 198: 272batch [00:20, 13.46batch/s, loss=1.43e+3]


epoch 198: avg train loss 1448.67, bar train loss 2.500, len train loss 0.028, col train loss 131.767


Epoch 199: 2batch [00:00, 12.90batch/s, loss=1.47e+3]

epoch 198: avg test  loss 1469.04, bar  test loss 2.620, len  test loss 0.031, col  test loss 133.732


Epoch 199: 272batch [00:20, 13.44batch/s, loss=1.58e+3]


epoch 199: avg train loss 1448.17, bar train loss 2.503, len train loss 0.028, col train loss 131.680


Epoch 200: 2batch [00:00, 13.33batch/s, loss=1.47e+3]

epoch 199: avg test  loss 1467.73, bar  test loss 2.610, len  test loss 0.031, col  test loss 133.465


Epoch 200: 272batch [00:20, 13.30batch/s, loss=1.46e+3]


epoch 200: avg train loss 1447.88, bar train loss 2.491, len train loss 0.028, col train loss 131.660
epoch 200: avg test  loss 1468.55, bar  test loss 2.690, len  test loss 0.032, col  test loss 133.848


Epoch 201: 272batch [00:20, 13.09batch/s, loss=1.33e+3]


epoch 201: avg train loss 1447.54, bar train loss 2.504, len train loss 0.028, col train loss 131.626


Epoch 202: 2batch [00:00, 13.70batch/s, loss=1.43e+3]

epoch 201: avg test  loss 1468.09, bar  test loss 2.657, len  test loss 0.032, col  test loss 133.732


Epoch 202: 272batch [00:20, 13.48batch/s, loss=1.45e+3]


epoch 202: avg train loss 1446.85, bar train loss 2.485, len train loss 0.028, col train loss 131.538


Epoch 203: 2batch [00:00, 13.61batch/s, loss=1.46e+3]

epoch 202: avg test  loss 1466.95, bar  test loss 2.614, len  test loss 0.030, col  test loss 133.437


Epoch 203: 272batch [00:20, 13.38batch/s, loss=1.61e+3]


epoch 203: avg train loss 1446.28, bar train loss 2.490, len train loss 0.029, col train loss 131.465


Epoch 204: 2batch [00:00, 13.79batch/s, loss=1.43e+3]

epoch 203: avg test  loss 1468.04, bar  test loss 2.621, len  test loss 0.032, col  test loss 133.593


Epoch 204: 272batch [00:20, 13.43batch/s, loss=1.6e+3] 


epoch 204: avg train loss 1446.08, bar train loss 2.485, len train loss 0.029, col train loss 131.425


Epoch 205: 2batch [00:00, 13.42batch/s, loss=1.47e+3]

epoch 204: avg test  loss 1467.02, bar  test loss 2.610, len  test loss 0.036, col  test loss 133.364


Epoch 205: 272batch [00:20, 13.35batch/s, loss=1.49e+3]


epoch 205: avg train loss 1445.53, bar train loss 2.493, len train loss 0.028, col train loss 131.358
epoch 205: avg test  loss 1467.53, bar  test loss 2.614, len  test loss 0.032, col  test loss 133.483


Epoch 206: 272batch [00:20, 13.02batch/s, loss=1.41e+3]


epoch 206: avg train loss 1445.22, bar train loss 2.485, len train loss 0.028, col train loss 131.305


Epoch 207: 2batch [00:00, 13.33batch/s, loss=1.38e+3]

epoch 206: avg test  loss 1465.73, bar  test loss 2.582, len  test loss 0.030, col  test loss 133.143


Epoch 207: 272batch [00:20, 13.43batch/s, loss=1.4e+3] 


epoch 207: avg train loss 1444.43, bar train loss 2.475, len train loss 0.028, col train loss 131.245


Epoch 208: 2batch [00:00, 13.51batch/s, loss=1.43e+3]

epoch 207: avg test  loss 1464.02, bar  test loss 2.596, len  test loss 0.030, col  test loss 133.077


Epoch 208: 272batch [00:20, 13.38batch/s, loss=1.53e+3]


epoch 208: avg train loss 1443.88, bar train loss 2.472, len train loss 0.028, col train loss 131.149


Epoch 209: 2batch [00:00, 13.70batch/s, loss=1.46e+3]

epoch 208: avg test  loss 1465.33, bar  test loss 2.582, len  test loss 0.031, col  test loss 133.335


Epoch 209: 272batch [00:20, 13.39batch/s, loss=1.46e+3]


epoch 209: avg train loss 1443.47, bar train loss 2.477, len train loss 0.028, col train loss 131.135


Epoch 210: 2batch [00:00, 13.16batch/s, loss=1.43e+3]

epoch 209: avg test  loss 1463.57, bar  test loss 2.606, len  test loss 0.031, col  test loss 132.952


Epoch 210: 272batch [00:20, 13.40batch/s, loss=1.49e+3]


epoch 210: avg train loss 1443.10, bar train loss 2.476, len train loss 0.028, col train loss 131.044
epoch 210: avg test  loss 1464.16, bar  test loss 2.652, len  test loss 0.030, col  test loss 133.404


Epoch 211: 272batch [00:20, 13.08batch/s, loss=1.57e+3]


epoch 211: avg train loss 1442.73, bar train loss 2.466, len train loss 0.028, col train loss 131.008


Epoch 212: 2batch [00:00, 13.07batch/s, loss=1.43e+3]

epoch 211: avg test  loss 1466.34, bar  test loss 2.664, len  test loss 0.030, col  test loss 133.500


Epoch 212: 272batch [00:20, 13.06batch/s, loss=1.41e+3]


epoch 212: avg train loss 1442.01, bar train loss 2.466, len train loss 0.028, col train loss 130.926


Epoch 213: 2batch [00:00, 13.24batch/s, loss=1.48e+3]

epoch 212: avg test  loss 1464.41, bar  test loss 2.580, len  test loss 0.030, col  test loss 132.888


Epoch 213: 272batch [00:20, 13.38batch/s, loss=1.42e+3]


epoch 213: avg train loss 1441.69, bar train loss 2.474, len train loss 0.028, col train loss 130.895


Epoch 214: 2batch [00:00, 13.61batch/s, loss=1.46e+3]

epoch 213: avg test  loss 1462.84, bar  test loss 2.635, len  test loss 0.034, col  test loss 132.854


Epoch 214: 272batch [00:20, 13.36batch/s, loss=1.5e+3] 


epoch 214: avg train loss 1441.85, bar train loss 2.455, len train loss 0.028, col train loss 130.890


Epoch 215: 2batch [00:00, 13.61batch/s, loss=1.48e+3]

epoch 214: avg test  loss 1463.43, bar  test loss 2.560, len  test loss 0.030, col  test loss 132.808


Epoch 215: 272batch [00:20, 13.25batch/s, loss=1.47e+3]


epoch 215: avg train loss 1441.09, bar train loss 2.455, len train loss 0.028, col train loss 130.789
epoch 215: avg test  loss 1464.39, bar  test loss 2.676, len  test loss 0.034, col  test loss 132.871


Epoch 216: 272batch [00:20, 13.15batch/s, loss=1.41e+3]


epoch 216: avg train loss 1440.48, bar train loss 2.458, len train loss 0.028, col train loss 130.743


Epoch 217: 2batch [00:00, 13.51batch/s, loss=1.42e+3]

epoch 216: avg test  loss 1461.55, bar  test loss 2.593, len  test loss 0.030, col  test loss 132.877


Epoch 217: 272batch [00:20, 13.31batch/s, loss=1.28e+3]


epoch 217: avg train loss 1440.12, bar train loss 2.456, len train loss 0.028, col train loss 130.704


Epoch 218: 2batch [00:00, 13.33batch/s, loss=1.45e+3]

epoch 217: avg test  loss 1461.53, bar  test loss 2.555, len  test loss 0.030, col  test loss 132.769


Epoch 218: 272batch [00:20, 13.31batch/s, loss=1.39e+3]


epoch 218: avg train loss 1439.71, bar train loss 2.455, len train loss 0.028, col train loss 130.623


Epoch 219: 2batch [00:00, 13.16batch/s, loss=1.42e+3]

epoch 218: avg test  loss 1460.46, bar  test loss 2.581, len  test loss 0.031, col  test loss 132.738


Epoch 219: 272batch [00:20, 13.32batch/s, loss=1.5e+3] 


epoch 219: avg train loss 1439.49, bar train loss 2.448, len train loss 0.027, col train loss 130.597


Epoch 220: 2batch [00:00, 13.61batch/s, loss=1.43e+3]

epoch 219: avg test  loss 1461.49, bar  test loss 2.636, len  test loss 0.031, col  test loss 132.745


Epoch 220: 272batch [00:20, 13.27batch/s, loss=1.32e+3]


epoch 220: avg train loss 1438.95, bar train loss 2.444, len train loss 0.028, col train loss 130.537
epoch 220: avg test  loss 1461.49, bar  test loss 2.627, len  test loss 0.036, col  test loss 132.709


Epoch 221: 272batch [00:20, 13.07batch/s, loss=1.49e+3]


epoch 221: avg train loss 1438.68, bar train loss 2.446, len train loss 0.028, col train loss 130.507


Epoch 222: 2batch [00:00, 12.99batch/s, loss=1.45e+3]

epoch 221: avg test  loss 1460.81, bar  test loss 2.572, len  test loss 0.030, col  test loss 132.379


Epoch 222: 272batch [00:20, 13.30batch/s, loss=1.51e+3]


epoch 222: avg train loss 1438.44, bar train loss 2.444, len train loss 0.028, col train loss 130.481


Epoch 223: 2batch [00:00, 13.51batch/s, loss=1.44e+3]

epoch 222: avg test  loss 1461.31, bar  test loss 2.608, len  test loss 0.035, col  test loss 132.476


Epoch 223: 272batch [00:20, 13.25batch/s, loss=1.47e+3]


epoch 223: avg train loss 1437.81, bar train loss 2.438, len train loss 0.028, col train loss 130.398


Epoch 224: 2batch [00:00, 13.16batch/s, loss=1.46e+3]

epoch 223: avg test  loss 1459.57, bar  test loss 2.572, len  test loss 0.030, col  test loss 132.556


Epoch 224: 272batch [00:20, 13.28batch/s, loss=1.5e+3] 


epoch 224: avg train loss 1437.40, bar train loss 2.431, len train loss 0.028, col train loss 130.344


Epoch 225: 2batch [00:00, 13.16batch/s, loss=1.51e+3]

epoch 224: avg test  loss 1458.92, bar  test loss 2.547, len  test loss 0.031, col  test loss 132.253


Epoch 225: 272batch [00:20, 13.30batch/s, loss=1.45e+3]


epoch 225: avg train loss 1436.65, bar train loss 2.440, len train loss 0.028, col train loss 130.266
epoch 225: avg test  loss 1458.29, bar  test loss 2.570, len  test loss 0.031, col  test loss 132.503


Epoch 226: 272batch [00:20, 13.06batch/s, loss=1.37e+3]


epoch 226: avg train loss 1436.46, bar train loss 2.434, len train loss 0.028, col train loss 130.263


Epoch 227: 2batch [00:00, 13.51batch/s, loss=1.49e+3]

epoch 226: avg test  loss 1458.78, bar  test loss 2.597, len  test loss 0.030, col  test loss 132.362


Epoch 227: 272batch [00:20, 13.28batch/s, loss=1.44e+3]


epoch 227: avg train loss 1436.17, bar train loss 2.435, len train loss 0.028, col train loss 130.186


Epoch 228: 2batch [00:00, 13.07batch/s, loss=1.47e+3]

epoch 227: avg test  loss 1460.71, bar  test loss 2.615, len  test loss 0.030, col  test loss 132.816


Epoch 228: 272batch [00:20, 13.28batch/s, loss=1.51e+3]


epoch 228: avg train loss 1436.06, bar train loss 2.433, len train loss 0.027, col train loss 130.194


Epoch 229: 2batch [00:00, 13.42batch/s, loss=1.45e+3]

epoch 228: avg test  loss 1457.71, bar  test loss 2.566, len  test loss 0.029, col  test loss 132.410


Epoch 229: 272batch [00:20, 13.10batch/s, loss=1.44e+3]


epoch 229: avg train loss 1435.38, bar train loss 2.425, len train loss 0.027, col train loss 130.124


Epoch 230: 2batch [00:00, 12.35batch/s, loss=1.43e+3]

epoch 229: avg test  loss 1457.01, bar  test loss 2.503, len  test loss 0.031, col  test loss 132.190


Epoch 230: 272batch [00:20, 13.25batch/s, loss=1.41e+3]


epoch 230: avg train loss 1435.46, bar train loss 2.424, len train loss 0.028, col train loss 130.094
epoch 230: avg test  loss 1457.50, bar  test loss 2.563, len  test loss 0.030, col  test loss 132.407


Epoch 231: 272batch [00:20, 12.97batch/s, loss=1.41e+3]


epoch 231: avg train loss 1434.86, bar train loss 2.418, len train loss 0.028, col train loss 130.039


Epoch 232: 2batch [00:00, 13.61batch/s, loss=1.45e+3]

epoch 231: avg test  loss 1457.91, bar  test loss 2.560, len  test loss 0.030, col  test loss 132.237


Epoch 232: 272batch [00:20, 13.02batch/s, loss=1.43e+3]


epoch 232: avg train loss 1434.38, bar train loss 2.414, len train loss 0.027, col train loss 130.000


Epoch 233: 2batch [00:00, 13.51batch/s, loss=1.43e+3]

epoch 232: avg test  loss 1457.64, bar  test loss 2.561, len  test loss 0.033, col  test loss 132.500


Epoch 233: 272batch [00:20, 13.28batch/s, loss=1.42e+3]


epoch 233: avg train loss 1434.11, bar train loss 2.422, len train loss 0.028, col train loss 129.956


Epoch 234: 2batch [00:00, 13.42batch/s, loss=1.43e+3]

epoch 233: avg test  loss 1457.13, bar  test loss 2.521, len  test loss 0.030, col  test loss 132.041


Epoch 234: 272batch [00:20, 13.15batch/s, loss=1.41e+3]


epoch 234: avg train loss 1433.63, bar train loss 2.413, len train loss 0.027, col train loss 129.871


Epoch 235: 2batch [00:00, 13.16batch/s, loss=1.44e+3]

epoch 234: avg test  loss 1456.81, bar  test loss 2.594, len  test loss 0.032, col  test loss 132.274


Epoch 235: 272batch [00:20, 13.25batch/s, loss=1.4e+3] 


epoch 235: avg train loss 1432.59, bar train loss 2.414, len train loss 0.028, col train loss 129.793
epoch 235: avg test  loss 1456.22, bar  test loss 2.536, len  test loss 0.030, col  test loss 132.177


Epoch 236: 272batch [00:20, 12.97batch/s, loss=1.4e+3] 


epoch 236: avg train loss 1433.14, bar train loss 2.414, len train loss 0.027, col train loss 129.808


Epoch 237: 2batch [00:00, 12.90batch/s, loss=1.46e+3]

epoch 236: avg test  loss 1457.27, bar  test loss 2.558, len  test loss 0.031, col  test loss 132.021


Epoch 237: 272batch [00:20, 13.21batch/s, loss=1.44e+3]


epoch 237: avg train loss 1432.61, bar train loss 2.411, len train loss 0.028, col train loss 129.764


Epoch 238: 2batch [00:00, 13.42batch/s, loss=1.47e+3]

epoch 237: avg test  loss 1455.77, bar  test loss 2.513, len  test loss 0.029, col  test loss 131.808


Epoch 238: 272batch [00:20, 13.17batch/s, loss=1.45e+3]


epoch 238: avg train loss 1432.05, bar train loss 2.412, len train loss 0.027, col train loss 129.665


Epoch 239: 2batch [00:00, 13.24batch/s, loss=1.44e+3]

epoch 238: avg test  loss 1455.23, bar  test loss 2.567, len  test loss 0.029, col  test loss 131.806


Epoch 239: 272batch [00:20, 13.28batch/s, loss=1.37e+3]


epoch 239: avg train loss 1431.59, bar train loss 2.403, len train loss 0.027, col train loss 129.636


Epoch 240: 2batch [00:00, 13.25batch/s, loss=1.38e+3]

epoch 239: avg test  loss 1455.36, bar  test loss 2.550, len  test loss 0.029, col  test loss 131.865


Epoch 240: 272batch [00:20, 13.25batch/s, loss=1.35e+3]


epoch 240: avg train loss 1431.47, bar train loss 2.404, len train loss 0.027, col train loss 129.631
epoch 240: avg test  loss 1455.14, bar  test loss 2.592, len  test loss 0.029, col  test loss 131.763


Epoch 241: 272batch [00:21, 12.92batch/s, loss=1.34e+3]


epoch 241: avg train loss 1430.76, bar train loss 2.400, len train loss 0.027, col train loss 129.536


Epoch 242: 2batch [00:00, 13.24batch/s, loss=1.41e+3]

epoch 241: avg test  loss 1455.16, bar  test loss 2.546, len  test loss 0.030, col  test loss 131.974


Epoch 242: 272batch [00:20, 13.14batch/s, loss=1.42e+3]


epoch 242: avg train loss 1430.45, bar train loss 2.398, len train loss 0.027, col train loss 129.515


Epoch 243: 2batch [00:00, 13.51batch/s, loss=1.45e+3]

epoch 242: avg test  loss 1456.25, bar  test loss 2.533, len  test loss 0.029, col  test loss 131.941


Epoch 243: 272batch [00:20, 13.20batch/s, loss=1.35e+3]


epoch 243: avg train loss 1430.30, bar train loss 2.403, len train loss 0.027, col train loss 129.485


Epoch 244: 2batch [00:00, 12.90batch/s, loss=1.46e+3]

epoch 243: avg test  loss 1456.30, bar  test loss 2.534, len  test loss 0.031, col  test loss 132.316


Epoch 244: 272batch [00:20, 13.21batch/s, loss=1.52e+3]


epoch 244: avg train loss 1429.98, bar train loss 2.399, len train loss 0.027, col train loss 129.441


Epoch 245: 2batch [00:00, 13.24batch/s, loss=1.46e+3]

epoch 244: avg test  loss 1454.60, bar  test loss 2.501, len  test loss 0.030, col  test loss 131.675


Epoch 245: 272batch [00:20, 13.21batch/s, loss=1.5e+3] 


epoch 245: avg train loss 1429.18, bar train loss 2.389, len train loss 0.027, col train loss 129.375
epoch 245: avg test  loss 1453.41, bar  test loss 2.513, len  test loss 0.029, col  test loss 131.559


Epoch 246: 272batch [00:21, 12.89batch/s, loss=1.39e+3]


epoch 246: avg train loss 1429.32, bar train loss 2.400, len train loss 0.027, col train loss 129.359


Epoch 247: 2batch [00:00, 13.42batch/s, loss=1.44e+3]

epoch 246: avg test  loss 1455.22, bar  test loss 2.593, len  test loss 0.030, col  test loss 131.892


Epoch 247: 272batch [00:20, 13.20batch/s, loss=1.42e+3]


epoch 247: avg train loss 1429.10, bar train loss 2.390, len train loss 0.027, col train loss 129.356


Epoch 248: 2batch [00:00, 13.61batch/s, loss=1.43e+3]

epoch 247: avg test  loss 1456.00, bar  test loss 2.555, len  test loss 0.030, col  test loss 132.092


Epoch 248: 272batch [00:20, 13.14batch/s, loss=1.41e+3]


epoch 248: avg train loss 1428.86, bar train loss 2.387, len train loss 0.027, col train loss 129.290


Epoch 249: 2batch [00:00, 12.99batch/s, loss=1.41e+3]

epoch 248: avg test  loss 1454.59, bar  test loss 2.516, len  test loss 0.030, col  test loss 132.075


Epoch 249: 272batch [00:20, 13.17batch/s, loss=1.35e+3]


epoch 249: avg train loss 1428.20, bar train loss 2.393, len train loss 0.027, col train loss 129.245


Epoch 250: 2batch [00:00, 13.16batch/s, loss=1.46e+3]

epoch 249: avg test  loss 1454.20, bar  test loss 2.517, len  test loss 0.030, col  test loss 131.988


Epoch 250: 272batch [00:20, 13.13batch/s, loss=1.49e+3]


epoch 250: avg train loss 1427.98, bar train loss 2.386, len train loss 0.027, col train loss 129.217
epoch 250: avg test  loss 1452.33, bar  test loss 2.508, len  test loss 0.033, col  test loss 131.421


Epoch 251: 272batch [00:21, 12.80batch/s, loss=1.49e+3]


epoch 251: avg train loss 1427.59, bar train loss 2.380, len train loss 0.028, col train loss 129.159


Epoch 252: 2batch [00:00, 13.42batch/s, loss=1.44e+3]

epoch 251: avg test  loss 1452.07, bar  test loss 2.531, len  test loss 0.030, col  test loss 131.537


Epoch 252: 272batch [00:20, 13.16batch/s, loss=1.5e+3] 


epoch 252: avg train loss 1427.28, bar train loss 2.385, len train loss 0.027, col train loss 129.091


Epoch 253: 2batch [00:00, 13.07batch/s, loss=1.45e+3]

epoch 252: avg test  loss 1451.74, bar  test loss 2.499, len  test loss 0.030, col  test loss 131.572


Epoch 253: 272batch [00:20, 13.14batch/s, loss=1.57e+3]


epoch 253: avg train loss 1427.17, bar train loss 2.388, len train loss 0.027, col train loss 129.098


Epoch 254: 2batch [00:00, 12.74batch/s, loss=1.48e+3]

epoch 253: avg test  loss 1451.70, bar  test loss 2.542, len  test loss 0.029, col  test loss 131.239


Epoch 254: 272batch [00:20, 13.16batch/s, loss=1.34e+3]


epoch 254: avg train loss 1426.85, bar train loss 2.379, len train loss 0.027, col train loss 129.065


Epoch 255: 2batch [00:00, 13.61batch/s, loss=1.46e+3]

epoch 254: avg test  loss 1451.03, bar  test loss 2.525, len  test loss 0.031, col  test loss 131.328


Epoch 255: 272batch [00:20, 13.14batch/s, loss=1.53e+3]


epoch 255: avg train loss 1426.59, bar train loss 2.382, len train loss 0.027, col train loss 129.009
epoch 255: avg test  loss 1451.13, bar  test loss 2.492, len  test loss 0.032, col  test loss 131.263


Epoch 256: 272batch [00:21, 12.81batch/s, loss=1.45e+3]


epoch 256: avg train loss 1426.07, bar train loss 2.378, len train loss 0.028, col train loss 128.954


Epoch 257: 2batch [00:00, 13.16batch/s, loss=1.45e+3]

epoch 256: avg test  loss 1452.21, bar  test loss 2.673, len  test loss 0.029, col  test loss 131.386


Epoch 257: 272batch [00:20, 13.12batch/s, loss=1.35e+3]


epoch 257: avg train loss 1426.20, bar train loss 2.381, len train loss 0.027, col train loss 128.957


Epoch 258: 2batch [00:00, 13.07batch/s, loss=1.42e+3]

epoch 257: avg test  loss 1451.76, bar  test loss 2.599, len  test loss 0.038, col  test loss 131.420


Epoch 258: 272batch [00:20, 13.07batch/s, loss=1.39e+3]


epoch 258: avg train loss 1425.76, bar train loss 2.378, len train loss 0.027, col train loss 128.920


Epoch 259: 2batch [00:00, 13.07batch/s, loss=1.46e+3]

epoch 258: avg test  loss 1450.23, bar  test loss 2.458, len  test loss 0.032, col  test loss 131.327


Epoch 259: 272batch [00:20, 13.11batch/s, loss=1.31e+3]


epoch 259: avg train loss 1424.86, bar train loss 2.374, len train loss 0.027, col train loss 128.826


Epoch 260: 2batch [00:00, 13.16batch/s, loss=1.4e+3]

epoch 259: avg test  loss 1452.09, bar  test loss 2.531, len  test loss 0.028, col  test loss 131.312


Epoch 260: 272batch [00:20, 13.08batch/s, loss=1.49e+3]


epoch 260: avg train loss 1425.05, bar train loss 2.377, len train loss 0.027, col train loss 128.858
epoch 260: avg test  loss 1449.60, bar  test loss 2.518, len  test loss 0.029, col  test loss 131.365


Epoch 261: 272batch [00:21, 12.73batch/s, loss=1.39e+3]


epoch 261: avg train loss 1424.99, bar train loss 2.384, len train loss 0.027, col train loss 128.836


Epoch 262: 2batch [00:00, 13.25batch/s, loss=1.45e+3]

epoch 261: avg test  loss 1451.31, bar  test loss 2.625, len  test loss 0.033, col  test loss 131.509


Epoch 262: 272batch [00:20, 13.11batch/s, loss=1.28e+3]


epoch 262: avg train loss 1424.39, bar train loss 2.367, len train loss 0.027, col train loss 128.771


Epoch 263: 2batch [00:00, 12.99batch/s, loss=1.41e+3]

epoch 262: avg test  loss 1452.56, bar  test loss 2.553, len  test loss 0.030, col  test loss 131.496


Epoch 263: 272batch [00:20, 13.01batch/s, loss=1.38e+3]


epoch 263: avg train loss 1424.36, bar train loss 2.370, len train loss 0.027, col train loss 128.720


Epoch 264: 2batch [00:00, 13.07batch/s, loss=1.5e+3]

epoch 263: avg test  loss 1449.12, bar  test loss 2.518, len  test loss 0.030, col  test loss 131.078


Epoch 264: 272batch [00:21, 12.63batch/s, loss=1.51e+3]


epoch 264: avg train loss 1423.73, bar train loss 2.367, len train loss 0.026, col train loss 128.682


Epoch 265: 2batch [00:00, 12.90batch/s, loss=1.41e+3]

epoch 264: avg test  loss 1449.20, bar  test loss 2.519, len  test loss 0.035, col  test loss 131.228


Epoch 265: 272batch [00:20, 13.00batch/s, loss=1.45e+3]


epoch 265: avg train loss 1422.98, bar train loss 2.361, len train loss 0.027, col train loss 128.604
epoch 265: avg test  loss 1448.71, bar  test loss 2.540, len  test loss 0.029, col  test loss 131.248


Epoch 266: 272batch [00:21, 12.71batch/s, loss=1.44e+3]


epoch 266: avg train loss 1423.10, bar train loss 2.367, len train loss 0.027, col train loss 128.638


Epoch 267: 2batch [00:00, 13.25batch/s, loss=1.43e+3]

epoch 266: avg test  loss 1447.92, bar  test loss 2.501, len  test loss 0.033, col  test loss 130.898


Epoch 267: 272batch [00:20, 13.03batch/s, loss=1.42e+3]


epoch 267: avg train loss 1423.11, bar train loss 2.371, len train loss 0.027, col train loss 128.593


Epoch 268: 2batch [00:00, 13.33batch/s, loss=1.44e+3]

epoch 267: avg test  loss 1448.03, bar  test loss 2.529, len  test loss 0.032, col  test loss 131.152


Epoch 268: 272batch [00:20, 13.09batch/s, loss=1.44e+3]


epoch 268: avg train loss 1422.62, bar train loss 2.358, len train loss 0.027, col train loss 128.538


Epoch 269: 2batch [00:00, 13.33batch/s, loss=1.43e+3]

epoch 268: avg test  loss 1449.12, bar  test loss 2.544, len  test loss 0.030, col  test loss 131.138


Epoch 269: 272batch [00:20, 13.03batch/s, loss=1.41e+3]


epoch 269: avg train loss 1422.02, bar train loss 2.356, len train loss 0.027, col train loss 128.496


Epoch 270: 2batch [00:00, 13.16batch/s, loss=1.37e+3]

epoch 269: avg test  loss 1448.00, bar  test loss 2.546, len  test loss 0.029, col  test loss 131.124


Epoch 270: 272batch [00:20, 12.98batch/s, loss=1.38e+3]


epoch 270: avg train loss 1422.05, bar train loss 2.353, len train loss 0.027, col train loss 128.472
epoch 270: avg test  loss 1447.99, bar  test loss 2.465, len  test loss 0.029, col  test loss 130.944


Epoch 271: 272batch [00:21, 12.64batch/s, loss=1.39e+3]


epoch 271: avg train loss 1421.94, bar train loss 2.356, len train loss 0.027, col train loss 128.471


Epoch 272: 2batch [00:00, 13.25batch/s, loss=1.41e+3]

epoch 271: avg test  loss 1447.28, bar  test loss 2.482, len  test loss 0.028, col  test loss 131.096


Epoch 272: 272batch [00:20, 12.96batch/s, loss=1.25e+3]


epoch 272: avg train loss 1421.60, bar train loss 2.343, len train loss 0.027, col train loss 128.422


Epoch 273: 2batch [00:00, 13.33batch/s, loss=1.41e+3]

epoch 272: avg test  loss 1446.90, bar  test loss 2.505, len  test loss 0.030, col  test loss 130.729


Epoch 273: 272batch [00:21, 12.74batch/s, loss=1.38e+3]


epoch 273: avg train loss 1420.84, bar train loss 2.352, len train loss 0.027, col train loss 128.307


Epoch 274: 2batch [00:00, 12.90batch/s, loss=1.49e+3]

epoch 273: avg test  loss 1447.32, bar  test loss 2.516, len  test loss 0.033, col  test loss 130.866


Epoch 274: 272batch [00:21, 12.78batch/s, loss=1.48e+3]


epoch 274: avg train loss 1421.03, bar train loss 2.342, len train loss 0.027, col train loss 128.349


Epoch 275: 2batch [00:00, 13.42batch/s, loss=1.45e+3]

epoch 274: avg test  loss 1450.93, bar  test loss 2.542, len  test loss 0.032, col  test loss 131.390


Epoch 275: 272batch [00:20, 12.99batch/s, loss=1.36e+3]


epoch 275: avg train loss 1420.94, bar train loss 2.353, len train loss 0.027, col train loss 128.310
epoch 275: avg test  loss 1447.09, bar  test loss 2.579, len  test loss 0.030, col  test loss 130.929


Epoch 276: 272batch [00:22, 12.22batch/s, loss=1.46e+3]


epoch 276: avg train loss 1420.19, bar train loss 2.345, len train loss 0.026, col train loss 128.272


Epoch 277: 2batch [00:00, 12.66batch/s, loss=1.45e+3]

epoch 276: avg test  loss 1448.93, bar  test loss 2.682, len  test loss 0.031, col  test loss 131.068


Epoch 277: 272batch [00:21, 12.88batch/s, loss=1.54e+3]


epoch 277: avg train loss 1419.95, bar train loss 2.350, len train loss 0.027, col train loss 128.239


Epoch 278: 2batch [00:00, 13.16batch/s, loss=1.47e+3]

epoch 277: avg test  loss 1446.30, bar  test loss 2.540, len  test loss 0.031, col  test loss 130.973


Epoch 278: 272batch [00:21, 12.95batch/s, loss=1.39e+3]


epoch 278: avg train loss 1419.45, bar train loss 2.341, len train loss 0.026, col train loss 128.184


Epoch 279: 2batch [00:00, 12.82batch/s, loss=1.43e+3]

epoch 278: avg test  loss 1448.08, bar  test loss 2.519, len  test loss 0.033, col  test loss 130.685


Epoch 279: 272batch [00:21, 12.84batch/s, loss=1.52e+3]


epoch 279: avg train loss 1419.52, bar train loss 2.349, len train loss 0.027, col train loss 128.159


Epoch 280: 2batch [00:00, 12.99batch/s, loss=1.41e+3]

epoch 279: avg test  loss 1446.72, bar  test loss 2.530, len  test loss 0.029, col  test loss 130.914


Epoch 280: 272batch [00:21, 12.87batch/s, loss=1.43e+3]


epoch 280: avg train loss 1419.20, bar train loss 2.347, len train loss 0.027, col train loss 128.098
epoch 280: avg test  loss 1444.79, bar  test loss 2.524, len  test loss 0.030, col  test loss 130.458


Epoch 281: 272batch [00:21, 12.50batch/s, loss=1.34e+3]


epoch 281: avg train loss 1418.58, bar train loss 2.344, len train loss 0.027, col train loss 128.066


Epoch 282: 2batch [00:00, 13.07batch/s, loss=1.38e+3]

epoch 281: avg test  loss 1445.09, bar  test loss 2.456, len  test loss 0.028, col  test loss 130.639


Epoch 282: 272batch [00:21, 12.81batch/s, loss=1.31e+3]


epoch 282: avg train loss 1418.74, bar train loss 2.341, len train loss 0.026, col train loss 128.052


Epoch 283: 2batch [00:00, 12.99batch/s, loss=1.4e+3]

epoch 282: avg test  loss 1444.98, bar  test loss 2.486, len  test loss 0.029, col  test loss 130.547


Epoch 283: 272batch [00:21, 12.80batch/s, loss=1.41e+3]


epoch 283: avg train loss 1418.06, bar train loss 2.337, len train loss 0.026, col train loss 127.999


Epoch 284: 2batch [00:00, 13.16batch/s, loss=1.39e+3]

epoch 283: avg test  loss 1446.25, bar  test loss 2.535, len  test loss 0.030, col  test loss 130.629


Epoch 284: 272batch [00:21, 12.91batch/s, loss=1.48e+3]


epoch 284: avg train loss 1417.95, bar train loss 2.341, len train loss 0.026, col train loss 127.978


Epoch 285: 2batch [00:00, 12.82batch/s, loss=1.42e+3]

epoch 284: avg test  loss 1445.26, bar  test loss 2.481, len  test loss 0.032, col  test loss 130.756


Epoch 285: 272batch [00:21, 12.86batch/s, loss=1.46e+3]


epoch 285: avg train loss 1417.60, bar train loss 2.338, len train loss 0.026, col train loss 127.915
epoch 285: avg test  loss 1444.42, bar  test loss 2.481, len  test loss 0.028, col  test loss 130.522


Epoch 286: 272batch [00:21, 12.53batch/s, loss=1.38e+3]


epoch 286: avg train loss 1417.62, bar train loss 2.337, len train loss 0.027, col train loss 127.922


Epoch 287: 2batch [00:00, 12.90batch/s, loss=1.35e+3]

epoch 286: avg test  loss 1445.50, bar  test loss 2.489, len  test loss 0.029, col  test loss 130.516


Epoch 287: 272batch [00:21, 12.85batch/s, loss=1.46e+3]


epoch 287: avg train loss 1417.29, bar train loss 2.340, len train loss 0.026, col train loss 127.904


Epoch 288: 2batch [00:00, 12.99batch/s, loss=1.41e+3]

epoch 287: avg test  loss 1444.09, bar  test loss 2.480, len  test loss 0.029, col  test loss 130.541


Epoch 288: 272batch [00:21, 12.79batch/s, loss=1.4e+3] 


epoch 288: avg train loss 1417.01, bar train loss 2.338, len train loss 0.026, col train loss 127.856


Epoch 289: 2batch [00:00, 13.07batch/s, loss=1.4e+3]

epoch 288: avg test  loss 1444.63, bar  test loss 2.542, len  test loss 0.030, col  test loss 130.691


Epoch 289: 272batch [00:21, 12.79batch/s, loss=1.42e+3]


epoch 289: avg train loss 1416.65, bar train loss 2.340, len train loss 0.027, col train loss 127.800


Epoch 290: 2batch [00:00, 13.16batch/s, loss=1.44e+3]

epoch 289: avg test  loss 1443.21, bar  test loss 2.554, len  test loss 0.029, col  test loss 130.431


Epoch 290: 272batch [00:21, 12.81batch/s, loss=1.47e+3]


epoch 290: avg train loss 1416.64, bar train loss 2.341, len train loss 0.026, col train loss 127.822
epoch 290: avg test  loss 1444.90, bar  test loss 2.503, len  test loss 0.029, col  test loss 130.864


Epoch 291: 272batch [00:21, 12.45batch/s, loss=1.49e+3]


epoch 291: avg train loss 1415.89, bar train loss 2.330, len train loss 0.027, col train loss 127.720


Epoch 292: 2batch [00:00, 13.16batch/s, loss=1.45e+3]

epoch 291: avg test  loss 1444.53, bar  test loss 2.501, len  test loss 0.030, col  test loss 130.371


Epoch 292: 272batch [00:21, 12.83batch/s, loss=1.52e+3]


epoch 292: avg train loss 1416.12, bar train loss 2.330, len train loss 0.027, col train loss 127.737


Epoch 293: 2batch [00:00, 13.16batch/s, loss=1.44e+3]

epoch 292: avg test  loss 1444.11, bar  test loss 2.457, len  test loss 0.031, col  test loss 130.212


Epoch 293: 272batch [00:21, 12.83batch/s, loss=1.45e+3]


epoch 293: avg train loss 1415.67, bar train loss 2.335, len train loss 0.026, col train loss 127.677


Epoch 294: 2batch [00:00, 13.25batch/s, loss=1.42e+3]

epoch 293: avg test  loss 1444.02, bar  test loss 2.472, len  test loss 0.030, col  test loss 130.490


Epoch 294: 272batch [00:21, 12.83batch/s, loss=1.34e+3]


epoch 294: avg train loss 1415.75, bar train loss 2.324, len train loss 0.027, col train loss 127.696


Epoch 295: 2batch [00:00, 13.07batch/s, loss=1.42e+3]

epoch 294: avg test  loss 1444.44, bar  test loss 2.498, len  test loss 0.042, col  test loss 130.535


Epoch 295: 272batch [00:21, 12.78batch/s, loss=1.42e+3]


epoch 295: avg train loss 1414.85, bar train loss 2.328, len train loss 0.026, col train loss 127.596
epoch 295: avg test  loss 1443.37, bar  test loss 2.623, len  test loss 0.029, col  test loss 130.265


Epoch 296: 272batch [00:22, 12.36batch/s, loss=1.49e+3]


epoch 296: avg train loss 1414.61, bar train loss 2.337, len train loss 0.026, col train loss 127.561


Epoch 297: 2batch [00:00, 13.16batch/s, loss=1.43e+3]

epoch 296: avg test  loss 1441.74, bar  test loss 2.467, len  test loss 0.028, col  test loss 130.132


Epoch 297: 272batch [00:21, 12.78batch/s, loss=1.42e+3]


epoch 297: avg train loss 1414.97, bar train loss 2.332, len train loss 0.026, col train loss 127.586


Epoch 298: 2batch [00:00, 12.90batch/s, loss=1.42e+3]

epoch 297: avg test  loss 1442.35, bar  test loss 2.522, len  test loss 0.031, col  test loss 130.195


Epoch 298: 272batch [00:21, 12.81batch/s, loss=1.37e+3]


epoch 298: avg train loss 1414.30, bar train loss 2.321, len train loss 0.026, col train loss 127.548


Epoch 299: 2batch [00:00, 13.16batch/s, loss=1.43e+3]

epoch 298: avg test  loss 1443.58, bar  test loss 2.523, len  test loss 0.029, col  test loss 130.370


Epoch 299: 272batch [00:21, 12.76batch/s, loss=1.46e+3]


epoch 299: avg train loss 1414.09, bar train loss 2.323, len train loss 0.027, col train loss 127.491


Epoch 300: 2batch [00:00, 13.42batch/s, loss=1.42e+3]

epoch 299: avg test  loss 1442.67, bar  test loss 2.459, len  test loss 0.030, col  test loss 130.565


Epoch 300: 272batch [00:21, 12.80batch/s, loss=1.39e+3]


epoch 300: avg train loss 1413.48, bar train loss 2.326, len train loss 0.026, col train loss 127.435
epoch 300: avg test  loss 1442.26, bar  test loss 2.479, len  test loss 0.028, col  test loss 130.255


Epoch 301: 272batch [00:22, 12.10batch/s, loss=1.4e+3] 


epoch 301: avg train loss 1413.53, bar train loss 2.329, len train loss 0.027, col train loss 127.438


Epoch 302: 2batch [00:00, 12.99batch/s, loss=1.34e+3]

epoch 301: avg test  loss 1443.11, bar  test loss 2.507, len  test loss 0.031, col  test loss 130.342


Epoch 302: 272batch [00:21, 12.73batch/s, loss=1.4e+3] 


epoch 302: avg train loss 1412.99, bar train loss 2.323, len train loss 0.026, col train loss 127.370


Epoch 303: 2batch [00:00, 12.99batch/s, loss=1.38e+3]

epoch 302: avg test  loss 1440.70, bar  test loss 2.559, len  test loss 0.029, col  test loss 130.186


Epoch 303: 272batch [00:21, 12.73batch/s, loss=1.34e+3]


epoch 303: avg train loss 1413.20, bar train loss 2.326, len train loss 0.026, col train loss 127.365


Epoch 304: 2batch [00:00, 12.58batch/s, loss=1.42e+3]

epoch 303: avg test  loss 1444.11, bar  test loss 2.530, len  test loss 0.034, col  test loss 130.047


Epoch 304: 272batch [00:21, 12.77batch/s, loss=1.26e+3]


epoch 304: avg train loss 1413.54, bar train loss 2.327, len train loss 0.027, col train loss 127.387


Epoch 305: 2batch [00:00, 12.50batch/s, loss=1.39e+3]

epoch 304: avg test  loss 1441.51, bar  test loss 2.498, len  test loss 0.038, col  test loss 130.127


Epoch 305: 272batch [00:21, 12.73batch/s, loss=1.49e+3]


epoch 305: avg train loss 1412.75, bar train loss 2.327, len train loss 0.026, col train loss 127.311
epoch 305: avg test  loss 1440.99, bar  test loss 2.462, len  test loss 0.030, col  test loss 130.179


Epoch 306: 272batch [00:22, 12.26batch/s, loss=1.37e+3]


epoch 306: avg train loss 1411.99, bar train loss 2.311, len train loss 0.026, col train loss 127.244


Epoch 307: 2batch [00:00, 12.50batch/s, loss=1.4e+3]

epoch 306: avg test  loss 1443.19, bar  test loss 2.469, len  test loss 0.032, col  test loss 130.152


Epoch 307: 272batch [00:21, 12.70batch/s, loss=1.43e+3]


epoch 307: avg train loss 1412.41, bar train loss 2.314, len train loss 0.026, col train loss 127.237


Epoch 308: 2batch [00:00, 12.19batch/s, loss=1.38e+3]

epoch 307: avg test  loss 1440.97, bar  test loss 2.499, len  test loss 0.029, col  test loss 130.061


Epoch 308: 272batch [00:21, 12.71batch/s, loss=1.5e+3] 


epoch 308: avg train loss 1411.74, bar train loss 2.326, len train loss 0.026, col train loss 127.203


Epoch 309: 2batch [00:00, 12.82batch/s, loss=1.46e+3]

epoch 308: avg test  loss 1440.46, bar  test loss 2.478, len  test loss 0.032, col  test loss 130.084


Epoch 309: 272batch [00:21, 12.73batch/s, loss=1.42e+3]


epoch 309: avg train loss 1411.42, bar train loss 2.313, len train loss 0.027, col train loss 127.183


Epoch 310: 2batch [00:00, 12.50batch/s, loss=1.44e+3]

epoch 309: avg test  loss 1440.55, bar  test loss 2.564, len  test loss 0.029, col  test loss 129.887


Epoch 310: 272batch [00:21, 12.74batch/s, loss=1.41e+3]


epoch 310: avg train loss 1411.22, bar train loss 2.320, len train loss 0.026, col train loss 127.149
epoch 310: avg test  loss 1439.31, bar  test loss 2.421, len  test loss 0.029, col  test loss 129.842


Epoch 311: 272batch [00:22, 12.27batch/s, loss=1.43e+3]


epoch 311: avg train loss 1410.94, bar train loss 2.312, len train loss 0.026, col train loss 127.091


Epoch 312: 2batch [00:00, 12.90batch/s, loss=1.43e+3]

epoch 311: avg test  loss 1441.51, bar  test loss 2.587, len  test loss 0.032, col  test loss 130.114


Epoch 312: 272batch [00:21, 12.71batch/s, loss=1.44e+3]


epoch 312: avg train loss 1411.13, bar train loss 2.322, len train loss 0.026, col train loss 127.114


Epoch 313: 2batch [00:00, 11.98batch/s, loss=1.43e+3]

epoch 312: avg test  loss 1441.26, bar  test loss 2.514, len  test loss 0.031, col  test loss 130.068


Epoch 313: 272batch [00:21, 12.65batch/s, loss=1.44e+3]


epoch 313: avg train loss 1410.34, bar train loss 2.315, len train loss 0.026, col train loss 127.027


Epoch 314: 2batch [00:00, 13.24batch/s, loss=1.44e+3]

epoch 313: avg test  loss 1438.86, bar  test loss 2.518, len  test loss 0.029, col  test loss 129.641


Epoch 314: 272batch [00:21, 12.68batch/s, loss=1.32e+3]


epoch 314: avg train loss 1409.61, bar train loss 2.312, len train loss 0.026, col train loss 126.951


Epoch 315: 2batch [00:00, 12.99batch/s, loss=1.48e+3]

epoch 314: avg test  loss 1438.68, bar  test loss 2.489, len  test loss 0.028, col  test loss 129.494


Epoch 315: 272batch [00:21, 12.70batch/s, loss=1.43e+3]


epoch 315: avg train loss 1409.52, bar train loss 2.319, len train loss 0.026, col train loss 126.926
epoch 315: avg test  loss 1437.25, bar  test loss 2.482, len  test loss 0.030, col  test loss 129.758


Epoch 316: 272batch [00:22, 12.18batch/s, loss=1.48e+3]


epoch 316: avg train loss 1409.68, bar train loss 2.316, len train loss 0.026, col train loss 126.936


Epoch 317: 2batch [00:00, 13.25batch/s, loss=1.37e+3]

epoch 316: avg test  loss 1438.68, bar  test loss 2.497, len  test loss 0.032, col  test loss 129.942


Epoch 317: 272batch [00:21, 12.65batch/s, loss=1.54e+3]


epoch 317: avg train loss 1409.50, bar train loss 2.322, len train loss 0.026, col train loss 126.888


Epoch 318: 2batch [00:00, 13.16batch/s, loss=1.4e+3]

epoch 317: avg test  loss 1439.52, bar  test loss 2.494, len  test loss 0.029, col  test loss 129.814


Epoch 318: 272batch [00:21, 12.63batch/s, loss=1.31e+3]


epoch 318: avg train loss 1408.96, bar train loss 2.315, len train loss 0.026, col train loss 126.860


Epoch 319: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 318: avg test  loss 1437.86, bar  test loss 2.452, len  test loss 0.028, col  test loss 129.798


Epoch 319: 272batch [00:21, 12.57batch/s, loss=1.59e+3]


epoch 319: avg train loss 1408.70, bar train loss 2.307, len train loss 0.026, col train loss 126.824


Epoch 320: 2batch [00:00, 12.82batch/s, loss=1.43e+3]

epoch 319: avg test  loss 1437.38, bar  test loss 2.415, len  test loss 0.028, col  test loss 129.541


Epoch 320: 272batch [00:21, 12.45batch/s, loss=1.56e+3]


epoch 320: avg train loss 1408.37, bar train loss 2.309, len train loss 0.026, col train loss 126.788
epoch 320: avg test  loss 1437.21, bar  test loss 2.481, len  test loss 0.031, col  test loss 129.733


Epoch 321: 272batch [00:22, 12.11batch/s, loss=1.37e+3]


epoch 321: avg train loss 1408.56, bar train loss 2.305, len train loss 0.026, col train loss 126.800


Epoch 322: 2batch [00:00, 11.49batch/s, loss=1.45e+3]

epoch 321: avg test  loss 1436.60, bar  test loss 2.482, len  test loss 0.031, col  test loss 129.688


Epoch 322: 272batch [00:21, 12.60batch/s, loss=1.43e+3]


epoch 322: avg train loss 1407.89, bar train loss 2.308, len train loss 0.026, col train loss 126.726


Epoch 323: 2batch [00:00, 12.90batch/s, loss=1.39e+3]

epoch 322: avg test  loss 1437.18, bar  test loss 2.523, len  test loss 0.028, col  test loss 129.529


Epoch 323: 272batch [00:21, 12.54batch/s, loss=1.37e+3]


epoch 323: avg train loss 1407.48, bar train loss 2.303, len train loss 0.026, col train loss 126.736


Epoch 324: 2batch [00:00, 13.16batch/s, loss=1.41e+3]

epoch 323: avg test  loss 1437.83, bar  test loss 2.496, len  test loss 0.033, col  test loss 129.777


Epoch 324: 272batch [00:21, 12.53batch/s, loss=1.41e+3]


epoch 324: avg train loss 1407.59, bar train loss 2.318, len train loss 0.026, col train loss 126.695


Epoch 325: 2batch [00:00, 12.90batch/s, loss=1.43e+3]

epoch 324: avg test  loss 1436.49, bar  test loss 2.524, len  test loss 0.029, col  test loss 129.591


Epoch 325: 272batch [00:21, 12.59batch/s, loss=1.35e+3]


epoch 325: avg train loss 1407.61, bar train loss 2.305, len train loss 0.025, col train loss 126.692
epoch 325: avg test  loss 1436.05, bar  test loss 2.440, len  test loss 0.029, col  test loss 129.423


Epoch 326: 272batch [00:22, 12.11batch/s, loss=1.24e+3]


epoch 326: avg train loss 1406.96, bar train loss 2.318, len train loss 0.026, col train loss 126.641


Epoch 327: 2batch [00:00, 12.82batch/s, loss=1.42e+3]

epoch 326: avg test  loss 1436.12, bar  test loss 2.480, len  test loss 0.029, col  test loss 129.319


Epoch 327: 272batch [00:21, 12.58batch/s, loss=1.39e+3]


epoch 327: avg train loss 1406.70, bar train loss 2.300, len train loss 0.026, col train loss 126.579


Epoch 328: 2batch [00:00, 12.82batch/s, loss=1.42e+3]

epoch 327: avg test  loss 1434.89, bar  test loss 2.434, len  test loss 0.029, col  test loss 129.292


Epoch 328: 272batch [00:21, 12.56batch/s, loss=1.29e+3]


epoch 328: avg train loss 1407.07, bar train loss 2.298, len train loss 0.026, col train loss 126.639


Epoch 329: 2batch [00:00, 12.66batch/s, loss=1.43e+3]

epoch 328: avg test  loss 1437.48, bar  test loss 2.470, len  test loss 0.030, col  test loss 129.518


Epoch 329: 272batch [00:21, 12.58batch/s, loss=1.44e+3]


epoch 329: avg train loss 1406.21, bar train loss 2.311, len train loss 0.026, col train loss 126.494


Epoch 330: 2batch [00:00, 12.99batch/s, loss=1.43e+3]

epoch 329: avg test  loss 1437.24, bar  test loss 2.481, len  test loss 0.033, col  test loss 129.339


Epoch 330: 272batch [00:21, 12.55batch/s, loss=1.4e+3] 


epoch 330: avg train loss 1405.68, bar train loss 2.307, len train loss 0.025, col train loss 126.478
epoch 330: avg test  loss 1436.03, bar  test loss 2.545, len  test loss 0.029, col  test loss 129.309


Epoch 331: 272batch [00:22, 11.96batch/s, loss=1.47e+3]


epoch 331: avg train loss 1405.81, bar train loss 2.300, len train loss 0.026, col train loss 126.484


Epoch 332: 2batch [00:00, 11.98batch/s, loss=1.47e+3]

epoch 331: avg test  loss 1436.48, bar  test loss 2.513, len  test loss 0.028, col  test loss 129.174


Epoch 332: 272batch [00:21, 12.56batch/s, loss=1.49e+3]


epoch 332: avg train loss 1405.46, bar train loss 2.299, len train loss 0.026, col train loss 126.451


Epoch 333: 2batch [00:00, 12.99batch/s, loss=1.32e+3]

epoch 332: avg test  loss 1434.61, bar  test loss 2.491, len  test loss 0.033, col  test loss 129.316


Epoch 333: 272batch [00:21, 12.50batch/s, loss=1.54e+3]


epoch 333: avg train loss 1405.41, bar train loss 2.305, len train loss 0.026, col train loss 126.420


Epoch 334: 2batch [00:00, 12.42batch/s, loss=1.39e+3]

epoch 333: avg test  loss 1435.45, bar  test loss 2.514, len  test loss 0.029, col  test loss 129.220


Epoch 334: 272batch [00:21, 12.42batch/s, loss=1.55e+3]


epoch 334: avg train loss 1405.09, bar train loss 2.296, len train loss 0.026, col train loss 126.358


Epoch 335: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 334: avg test  loss 1435.96, bar  test loss 2.452, len  test loss 0.029, col  test loss 129.016


Epoch 335: 272batch [00:21, 12.46batch/s, loss=1.43e+3]


epoch 335: avg train loss 1404.53, bar train loss 2.300, len train loss 0.026, col train loss 126.325
epoch 335: avg test  loss 1433.34, bar  test loss 2.474, len  test loss 0.029, col  test loss 128.982


Epoch 336: 272batch [00:22, 12.01batch/s, loss=1.37e+3]


epoch 336: avg train loss 1404.51, bar train loss 2.295, len train loss 0.026, col train loss 126.334


Epoch 337: 2batch [00:00, 12.27batch/s, loss=1.39e+3]

epoch 336: avg test  loss 1436.89, bar  test loss 2.486, len  test loss 0.029, col  test loss 129.435


Epoch 337: 272batch [00:21, 12.44batch/s, loss=1.37e+3]


epoch 337: avg train loss 1404.36, bar train loss 2.304, len train loss 0.026, col train loss 126.303


Epoch 338: 2batch [00:00, 12.66batch/s, loss=1.39e+3]

epoch 337: avg test  loss 1433.80, bar  test loss 2.490, len  test loss 0.029, col  test loss 129.312


Epoch 338: 272batch [00:21, 12.42batch/s, loss=1.37e+3]


epoch 338: avg train loss 1403.80, bar train loss 2.304, len train loss 0.025, col train loss 126.257


Epoch 339: 2batch [00:00, 12.99batch/s, loss=1.43e+3]

epoch 338: avg test  loss 1433.09, bar  test loss 2.539, len  test loss 0.032, col  test loss 128.949


Epoch 339: 272batch [00:21, 12.40batch/s, loss=1.29e+3]


epoch 339: avg train loss 1404.05, bar train loss 2.303, len train loss 0.026, col train loss 126.257


Epoch 340: 2batch [00:00, 12.90batch/s, loss=1.42e+3]

epoch 339: avg test  loss 1434.54, bar  test loss 2.479, len  test loss 0.030, col  test loss 129.401


Epoch 340: 272batch [00:21, 12.38batch/s, loss=1.51e+3]


epoch 340: avg train loss 1403.79, bar train loss 2.309, len train loss 0.026, col train loss 126.211
epoch 340: avg test  loss 1434.73, bar  test loss 2.479, len  test loss 0.027, col  test loss 129.120


Epoch 341: 272batch [00:23, 11.78batch/s, loss=1.42e+3]


epoch 341: avg train loss 1403.22, bar train loss 2.297, len train loss 0.025, col train loss 126.153


Epoch 342: 2batch [00:00, 12.19batch/s, loss=1.39e+3]

epoch 341: avg test  loss 1433.27, bar  test loss 2.463, len  test loss 0.028, col  test loss 129.029


Epoch 342: 272batch [00:22, 12.35batch/s, loss=1.43e+3]


epoch 342: avg train loss 1403.07, bar train loss 2.309, len train loss 0.026, col train loss 126.129


Epoch 343: 2batch [00:00, 12.12batch/s, loss=1.42e+3]

epoch 342: avg test  loss 1433.09, bar  test loss 2.525, len  test loss 0.031, col  test loss 129.148


Epoch 343: 272batch [00:21, 12.38batch/s, loss=1.33e+3]


epoch 343: avg train loss 1402.67, bar train loss 2.295, len train loss 0.025, col train loss 126.092


Epoch 344: 2batch [00:00, 12.58batch/s, loss=1.45e+3]

epoch 343: avg test  loss 1433.92, bar  test loss 2.553, len  test loss 0.029, col  test loss 128.798


Epoch 344: 272batch [00:22, 12.36batch/s, loss=1.5e+3] 


epoch 344: avg train loss 1403.23, bar train loss 2.303, len train loss 0.026, col train loss 126.121


Epoch 345: 2batch [00:00, 12.50batch/s, loss=1.36e+3]

epoch 344: avg test  loss 1432.81, bar  test loss 2.427, len  test loss 0.029, col  test loss 129.137


Epoch 345: 272batch [00:22, 12.36batch/s, loss=1.49e+3]


epoch 345: avg train loss 1403.09, bar train loss 2.296, len train loss 0.025, col train loss 126.103
epoch 345: avg test  loss 1432.52, bar  test loss 2.451, len  test loss 0.028, col  test loss 129.178


Epoch 346: 272batch [00:23, 11.61batch/s, loss=1.52e+3]


epoch 346: avg train loss 1402.39, bar train loss 2.287, len train loss 0.026, col train loss 126.044


Epoch 347: 2batch [00:00, 12.99batch/s, loss=1.42e+3]

epoch 346: avg test  loss 1431.78, bar  test loss 2.423, len  test loss 0.029, col  test loss 129.115


Epoch 347: 272batch [00:22, 12.31batch/s, loss=1.47e+3]


epoch 347: avg train loss 1402.45, bar train loss 2.298, len train loss 0.026, col train loss 126.047


Epoch 348: 2batch [00:00, 12.58batch/s, loss=1.46e+3]

epoch 347: avg test  loss 1432.43, bar  test loss 2.461, len  test loss 0.030, col  test loss 128.862


Epoch 348: 272batch [00:22, 12.32batch/s, loss=1.29e+3]


epoch 348: avg train loss 1402.07, bar train loss 2.307, len train loss 0.026, col train loss 126.003


Epoch 349: 2batch [00:00, 12.35batch/s, loss=1.39e+3]

epoch 348: avg test  loss 1431.83, bar  test loss 2.448, len  test loss 0.032, col  test loss 128.853


Epoch 349: 272batch [00:21, 12.37batch/s, loss=1.45e+3]


epoch 349: avg train loss 1401.22, bar train loss 2.286, len train loss 0.026, col train loss 125.954


Epoch 350: 2batch [00:00, 12.90batch/s, loss=1.42e+3]

epoch 349: avg test  loss 1433.17, bar  test loss 2.496, len  test loss 0.029, col  test loss 129.059


Epoch 350: 272batch [00:22, 12.33batch/s, loss=1.29e+3]


epoch 350: avg train loss 1401.58, bar train loss 2.296, len train loss 0.026, col train loss 125.958
epoch 350: avg test  loss 1431.73, bar  test loss 2.475, len  test loss 0.030, col  test loss 128.814


Epoch 351: 272batch [00:23, 11.67batch/s, loss=1.42e+3]


epoch 351: avg train loss 1401.53, bar train loss 2.287, len train loss 0.026, col train loss 125.927


Epoch 352: 1batch [00:00,  8.85batch/s, loss=1.35e+3]

epoch 351: avg test  loss 1431.12, bar  test loss 2.417, len  test loss 0.029, col  test loss 128.791


Epoch 352: 272batch [00:22, 12.28batch/s, loss=1.4e+3] 


epoch 352: avg train loss 1401.03, bar train loss 2.288, len train loss 0.025, col train loss 125.904


Epoch 353: 2batch [00:00, 12.20batch/s, loss=1.37e+3]

epoch 352: avg test  loss 1430.80, bar  test loss 2.528, len  test loss 0.029, col  test loss 128.665


Epoch 353: 272batch [00:21, 12.37batch/s, loss=1.33e+3]


epoch 353: avg train loss 1400.76, bar train loss 2.290, len train loss 0.025, col train loss 125.853


Epoch 354: 2batch [00:00, 12.27batch/s, loss=1.42e+3]

epoch 353: avg test  loss 1430.18, bar  test loss 2.452, len  test loss 0.029, col  test loss 128.561


Epoch 354: 272batch [00:22, 12.34batch/s, loss=1.29e+3]


epoch 354: avg train loss 1400.66, bar train loss 2.291, len train loss 0.026, col train loss 125.801


Epoch 355: 2batch [00:00, 12.50batch/s, loss=1.41e+3]

epoch 354: avg test  loss 1432.40, bar  test loss 2.463, len  test loss 0.030, col  test loss 128.851


Epoch 355: 272batch [00:22, 12.31batch/s, loss=1.47e+3]


epoch 355: avg train loss 1400.58, bar train loss 2.290, len train loss 0.025, col train loss 125.806
epoch 355: avg test  loss 1428.99, bar  test loss 2.419, len  test loss 0.028, col  test loss 128.497


Epoch 356: 272batch [00:23, 11.82batch/s, loss=1.4e+3] 


epoch 356: avg train loss 1400.17, bar train loss 2.286, len train loss 0.025, col train loss 125.763


Epoch 357: 2batch [00:00, 12.50batch/s, loss=1.42e+3]

epoch 356: avg test  loss 1429.86, bar  test loss 2.471, len  test loss 0.029, col  test loss 128.687


Epoch 357: 272batch [00:22, 12.27batch/s, loss=1.36e+3]


epoch 357: avg train loss 1400.17, bar train loss 2.290, len train loss 0.025, col train loss 125.738


Epoch 358: 2batch [00:00, 12.50batch/s, loss=1.42e+3]

epoch 357: avg test  loss 1432.14, bar  test loss 2.477, len  test loss 0.033, col  test loss 128.677


Epoch 358: 272batch [00:22, 12.21batch/s, loss=1.46e+3]


epoch 358: avg train loss 1399.64, bar train loss 2.280, len train loss 0.025, col train loss 125.710


Epoch 359: 2batch [00:00, 12.74batch/s, loss=1.37e+3]

epoch 358: avg test  loss 1430.62, bar  test loss 2.422, len  test loss 0.029, col  test loss 128.483


Epoch 359: 272batch [00:22, 12.19batch/s, loss=1.39e+3]


epoch 359: avg train loss 1399.36, bar train loss 2.291, len train loss 0.025, col train loss 125.686


Epoch 360: 2batch [00:00, 12.58batch/s, loss=1.39e+3]

epoch 359: avg test  loss 1430.78, bar  test loss 2.476, len  test loss 0.029, col  test loss 128.386


Epoch 360: 272batch [00:22, 12.21batch/s, loss=1.42e+3]


epoch 360: avg train loss 1399.81, bar train loss 2.294, len train loss 0.025, col train loss 125.706
epoch 360: avg test  loss 1429.61, bar  test loss 2.462, len  test loss 0.033, col  test loss 128.670


Epoch 361: 272batch [00:23, 11.77batch/s, loss=1.46e+3]


epoch 361: avg train loss 1399.28, bar train loss 2.286, len train loss 0.025, col train loss 125.649


Epoch 362: 2batch [00:00, 12.82batch/s, loss=1.35e+3]

epoch 361: avg test  loss 1429.75, bar  test loss 2.512, len  test loss 0.029, col  test loss 128.571


Epoch 362: 272batch [00:22, 12.21batch/s, loss=1.43e+3]


epoch 362: avg train loss 1399.34, bar train loss 2.295, len train loss 0.026, col train loss 125.641


Epoch 363: 2batch [00:00, 12.82batch/s, loss=1.35e+3]

epoch 362: avg test  loss 1430.58, bar  test loss 2.477, len  test loss 0.031, col  test loss 128.846


Epoch 363: 272batch [00:22, 12.19batch/s, loss=1.45e+3]


epoch 363: avg train loss 1398.96, bar train loss 2.280, len train loss 0.026, col train loss 125.625


Epoch 364: 2batch [00:00, 12.42batch/s, loss=1.41e+3]

epoch 363: avg test  loss 1428.93, bar  test loss 2.440, len  test loss 0.028, col  test loss 128.472


Epoch 364: 272batch [00:22, 12.18batch/s, loss=1.4e+3] 


epoch 364: avg train loss 1398.73, bar train loss 2.289, len train loss 0.025, col train loss 125.566


Epoch 365: 2batch [00:00, 12.42batch/s, loss=1.48e+3]

epoch 364: avg test  loss 1428.22, bar  test loss 2.449, len  test loss 0.028, col  test loss 128.472


Epoch 365: 272batch [00:22, 12.19batch/s, loss=1.46e+3]


epoch 365: avg train loss 1398.66, bar train loss 2.288, len train loss 0.025, col train loss 125.567
epoch 365: avg test  loss 1429.97, bar  test loss 2.513, len  test loss 0.031, col  test loss 128.788


Epoch 366: 272batch [00:23, 11.72batch/s, loss=1.42e+3]


epoch 366: avg train loss 1398.62, bar train loss 2.284, len train loss 0.026, col train loss 125.595


Epoch 367: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 366: avg test  loss 1429.83, bar  test loss 2.465, len  test loss 0.028, col  test loss 128.688


Epoch 367: 272batch [00:22, 12.20batch/s, loss=1.44e+3]


epoch 367: avg train loss 1398.55, bar train loss 2.286, len train loss 0.025, col train loss 125.545


Epoch 368: 2batch [00:00, 12.12batch/s, loss=1.41e+3]

epoch 367: avg test  loss 1430.15, bar  test loss 2.514, len  test loss 0.029, col  test loss 128.596


Epoch 368: 272batch [00:22, 12.13batch/s, loss=1.3e+3] 


epoch 368: avg train loss 1397.76, bar train loss 2.277, len train loss 0.025, col train loss 125.443


Epoch 369: 2batch [00:00, 12.27batch/s, loss=1.41e+3]

epoch 368: avg test  loss 1430.35, bar  test loss 2.482, len  test loss 0.029, col  test loss 128.337


Epoch 369: 272batch [00:22, 12.07batch/s, loss=1.32e+3]


epoch 369: avg train loss 1398.51, bar train loss 2.290, len train loss 0.026, col train loss 125.533


Epoch 370: 2batch [00:00, 12.58batch/s, loss=1.49e+3]

epoch 369: avg test  loss 1428.97, bar  test loss 2.502, len  test loss 0.029, col  test loss 128.545


Epoch 370: 272batch [00:22, 12.11batch/s, loss=1.33e+3]


epoch 370: avg train loss 1397.64, bar train loss 2.277, len train loss 0.025, col train loss 125.462
epoch 370: avg test  loss 1429.38, bar  test loss 2.548, len  test loss 0.029, col  test loss 128.349


Epoch 371: 272batch [00:23, 11.48batch/s, loss=1.5e+3] 


epoch 371: avg train loss 1396.92, bar train loss 2.270, len train loss 0.025, col train loss 125.366


Epoch 372: 2batch [00:00, 12.50batch/s, loss=1.39e+3]

epoch 371: avg test  loss 1428.13, bar  test loss 2.460, len  test loss 0.029, col  test loss 128.444


Epoch 372: 272batch [00:22, 12.10batch/s, loss=1.41e+3]


epoch 372: avg train loss 1397.10, bar train loss 2.279, len train loss 0.026, col train loss 125.361


Epoch 373: 2batch [00:00, 12.58batch/s, loss=1.41e+3]

epoch 372: avg test  loss 1429.71, bar  test loss 2.422, len  test loss 0.028, col  test loss 128.359


Epoch 373: 272batch [00:22, 12.08batch/s, loss=1.3e+3] 


epoch 373: avg train loss 1397.20, bar train loss 2.274, len train loss 0.025, col train loss 125.371


Epoch 374: 2batch [00:00, 12.20batch/s, loss=1.43e+3]

epoch 373: avg test  loss 1427.82, bar  test loss 2.446, len  test loss 0.028, col  test loss 128.332


Epoch 374: 272batch [00:22, 12.06batch/s, loss=1.38e+3]


epoch 374: avg train loss 1397.16, bar train loss 2.284, len train loss 0.025, col train loss 125.354


Epoch 375: 2batch [00:00, 12.58batch/s, loss=1.39e+3]

epoch 374: avg test  loss 1427.12, bar  test loss 2.451, len  test loss 0.029, col  test loss 128.384


Epoch 375: 272batch [00:22, 12.01batch/s, loss=1.39e+3]


epoch 375: avg train loss 1396.45, bar train loss 2.265, len train loss 0.025, col train loss 125.324
epoch 375: avg test  loss 1427.48, bar  test loss 2.475, len  test loss 0.034, col  test loss 128.442


Epoch 376: 272batch [00:23, 11.44batch/s, loss=1.32e+3]


epoch 376: avg train loss 1397.12, bar train loss 2.284, len train loss 0.025, col train loss 125.346


Epoch 377: 2batch [00:00, 12.20batch/s, loss=1.43e+3]

epoch 376: avg test  loss 1428.29, bar  test loss 2.475, len  test loss 0.029, col  test loss 128.426


Epoch 377: 272batch [00:22, 12.00batch/s, loss=1.33e+3]


epoch 377: avg train loss 1396.38, bar train loss 2.280, len train loss 0.026, col train loss 125.269


Epoch 378: 2batch [00:00, 12.27batch/s, loss=1.46e+3]

epoch 377: avg test  loss 1427.00, bar  test loss 2.483, len  test loss 0.029, col  test loss 128.389


Epoch 378: 272batch [00:22, 11.99batch/s, loss=1.39e+3]


epoch 378: avg train loss 1395.67, bar train loss 2.277, len train loss 0.026, col train loss 125.204


Epoch 379: 2batch [00:00, 12.35batch/s, loss=1.4e+3]

epoch 378: avg test  loss 1426.25, bar  test loss 2.473, len  test loss 0.030, col  test loss 128.224


Epoch 379: 272batch [00:22, 11.97batch/s, loss=1.26e+3]


epoch 379: avg train loss 1396.15, bar train loss 2.283, len train loss 0.025, col train loss 125.254


Epoch 380: 2batch [00:00, 12.35batch/s, loss=1.38e+3]

epoch 379: avg test  loss 1427.33, bar  test loss 2.478, len  test loss 0.028, col  test loss 128.160


Epoch 380: 272batch [00:22, 11.83batch/s, loss=1.25e+3]


epoch 380: avg train loss 1395.92, bar train loss 2.290, len train loss 0.025, col train loss 125.219
epoch 380: avg test  loss 1426.43, bar  test loss 2.466, len  test loss 0.028, col  test loss 128.358


Epoch 381: 272batch [00:24, 11.30batch/s, loss=1.48e+3]


epoch 381: avg train loss 1396.05, bar train loss 2.282, len train loss 0.025, col train loss 125.217


Epoch 382: 2batch [00:00, 12.35batch/s, loss=1.38e+3]

epoch 381: avg test  loss 1425.04, bar  test loss 2.461, len  test loss 0.030, col  test loss 128.019


Epoch 382: 272batch [00:22, 11.96batch/s, loss=1.46e+3]


epoch 382: avg train loss 1395.61, bar train loss 2.280, len train loss 0.025, col train loss 125.153


Epoch 383: 0batch [00:00, ?batch/s]

epoch 382: avg test  loss 1428.55, bar  test loss 2.551, len  test loss 0.028, col  test loss 128.399


Epoch 383: 272batch [00:22, 11.97batch/s, loss=1.38e+3]


epoch 383: avg train loss 1395.57, bar train loss 2.268, len train loss 0.025, col train loss 125.143


Epoch 384: 2batch [00:00, 12.74batch/s, loss=1.36e+3]

epoch 383: avg test  loss 1426.88, bar  test loss 2.415, len  test loss 0.030, col  test loss 127.958


Epoch 384: 272batch [00:22, 11.91batch/s, loss=1.39e+3]


epoch 384: avg train loss 1395.21, bar train loss 2.271, len train loss 0.026, col train loss 125.121


Epoch 385: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 384: avg test  loss 1424.76, bar  test loss 2.414, len  test loss 0.029, col  test loss 128.094


Epoch 385: 272batch [00:22, 11.88batch/s, loss=1.5e+3] 


epoch 385: avg train loss 1395.48, bar train loss 2.272, len train loss 0.026, col train loss 125.142
epoch 385: avg test  loss 1425.72, bar  test loss 2.473, len  test loss 0.029, col  test loss 128.001


Epoch 386: 272batch [00:23, 11.43batch/s, loss=1.41e+3]


epoch 386: avg train loss 1395.19, bar train loss 2.265, len train loss 0.025, col train loss 125.106


Epoch 387: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 386: avg test  loss 1428.58, bar  test loss 2.572, len  test loss 0.028, col  test loss 128.189


Epoch 387: 272batch [00:22, 11.92batch/s, loss=1.4e+3] 


epoch 387: avg train loss 1394.78, bar train loss 2.276, len train loss 0.025, col train loss 125.050


Epoch 388: 2batch [00:00, 12.35batch/s, loss=1.49e+3]

epoch 387: avg test  loss 1427.18, bar  test loss 2.530, len  test loss 0.029, col  test loss 128.267


Epoch 388: 272batch [00:22, 11.92batch/s, loss=1.37e+3]


epoch 388: avg train loss 1394.52, bar train loss 2.273, len train loss 0.026, col train loss 125.057


Epoch 389: 2batch [00:00, 12.20batch/s, loss=1.35e+3]

epoch 388: avg test  loss 1425.66, bar  test loss 2.414, len  test loss 0.029, col  test loss 128.279


Epoch 389: 272batch [00:22, 11.83batch/s, loss=1.28e+3]


epoch 389: avg train loss 1394.58, bar train loss 2.264, len train loss 0.025, col train loss 125.062


Epoch 390: 2batch [00:00, 11.70batch/s, loss=1.4e+3]

epoch 389: avg test  loss 1427.50, bar  test loss 2.463, len  test loss 0.028, col  test loss 127.960


Epoch 390: 272batch [00:23, 11.82batch/s, loss=1.36e+3]


epoch 390: avg train loss 1394.04, bar train loss 2.275, len train loss 0.025, col train loss 124.973
epoch 390: avg test  loss 1425.38, bar  test loss 2.424, len  test loss 0.028, col  test loss 128.132


Epoch 391: 272batch [00:24, 11.08batch/s, loss=1.42e+3]


epoch 391: avg train loss 1394.64, bar train loss 2.272, len train loss 0.025, col train loss 125.040


Epoch 392: 2batch [00:00, 12.42batch/s, loss=1.45e+3]

epoch 391: avg test  loss 1425.52, bar  test loss 2.446, len  test loss 0.028, col  test loss 127.793


Epoch 392: 272batch [00:23, 11.82batch/s, loss=1.45e+3]


epoch 392: avg train loss 1394.54, bar train loss 2.277, len train loss 0.025, col train loss 125.007


Epoch 393: 2batch [00:00, 12.20batch/s, loss=1.42e+3]

epoch 392: avg test  loss 1424.27, bar  test loss 2.440, len  test loss 0.028, col  test loss 128.028


Epoch 393: 272batch [00:23, 11.74batch/s, loss=1.4e+3] 


epoch 393: avg train loss 1393.59, bar train loss 2.259, len train loss 0.025, col train loss 124.904


Epoch 394: 2batch [00:00, 12.42batch/s, loss=1.41e+3]

epoch 393: avg test  loss 1427.02, bar  test loss 2.464, len  test loss 0.028, col  test loss 128.163


Epoch 394: 272batch [00:23, 11.74batch/s, loss=1.4e+3] 


epoch 394: avg train loss 1393.86, bar train loss 2.269, len train loss 0.025, col train loss 124.947


Epoch 395: 2batch [00:00, 11.63batch/s, loss=1.43e+3]

epoch 394: avg test  loss 1425.04, bar  test loss 2.450, len  test loss 0.028, col  test loss 127.714


Epoch 395: 272batch [00:23, 11.75batch/s, loss=1.4e+3] 


epoch 395: avg train loss 1393.63, bar train loss 2.274, len train loss 0.025, col train loss 124.918
epoch 395: avg test  loss 1425.86, bar  test loss 2.492, len  test loss 0.030, col  test loss 127.701


Epoch 396: 272batch [00:24, 11.27batch/s, loss=1.36e+3]


epoch 396: avg train loss 1393.55, bar train loss 2.271, len train loss 0.025, col train loss 124.910


Epoch 397: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 396: avg test  loss 1423.95, bar  test loss 2.426, len  test loss 0.029, col  test loss 128.035


Epoch 397: 272batch [00:23, 11.77batch/s, loss=1.34e+3]


epoch 397: avg train loss 1393.20, bar train loss 2.274, len train loss 0.025, col train loss 124.860


Epoch 398: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 397: avg test  loss 1424.36, bar  test loss 2.447, len  test loss 0.027, col  test loss 127.714


Epoch 398: 272batch [00:23, 11.76batch/s, loss=1.49e+3]


epoch 398: avg train loss 1393.18, bar train loss 2.268, len train loss 0.025, col train loss 124.839


Epoch 399: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 398: avg test  loss 1424.82, bar  test loss 2.475, len  test loss 0.028, col  test loss 127.790


Epoch 399: 272batch [00:23, 11.72batch/s, loss=1.36e+3]


epoch 399: avg train loss 1393.15, bar train loss 2.272, len train loss 0.026, col train loss 124.850


Epoch 400: 2batch [00:00, 12.05batch/s, loss=1.43e+3]

epoch 399: avg test  loss 1423.16, bar  test loss 2.413, len  test loss 0.028, col  test loss 127.862


Epoch 400: 272batch [00:23, 11.74batch/s, loss=1.35e+3]


epoch 400: avg train loss 1392.79, bar train loss 2.274, len train loss 0.025, col train loss 124.796
epoch 400: avg test  loss 1425.14, bar  test loss 2.458, len  test loss 0.030, col  test loss 127.691


Epoch 401: 272batch [00:24, 11.02batch/s, loss=1.39e+3]


epoch 401: avg train loss 1392.88, bar train loss 2.271, len train loss 0.025, col train loss 124.793


Epoch 402: 2batch [00:00, 12.27batch/s, loss=1.38e+3]

epoch 401: avg test  loss 1424.78, bar  test loss 2.437, len  test loss 0.028, col  test loss 128.059


Epoch 402: 272batch [00:23, 11.67batch/s, loss=1.32e+3]


epoch 402: avg train loss 1392.65, bar train loss 2.270, len train loss 0.025, col train loss 124.771


Epoch 403: 2batch [00:00, 12.12batch/s, loss=1.37e+3]

epoch 402: avg test  loss 1424.91, bar  test loss 2.514, len  test loss 0.034, col  test loss 127.911


Epoch 403: 272batch [00:23, 11.66batch/s, loss=1.44e+3]


epoch 403: avg train loss 1392.33, bar train loss 2.261, len train loss 0.025, col train loss 124.728


Epoch 404: 2batch [00:00, 12.35batch/s, loss=1.39e+3]

epoch 403: avg test  loss 1424.50, bar  test loss 2.424, len  test loss 0.029, col  test loss 128.091


Epoch 404: 272batch [00:23, 11.65batch/s, loss=1.39e+3]


epoch 404: avg train loss 1391.60, bar train loss 2.266, len train loss 0.026, col train loss 124.677


Epoch 405: 2batch [00:00, 12.42batch/s, loss=1.44e+3]

epoch 404: avg test  loss 1423.40, bar  test loss 2.439, len  test loss 0.029, col  test loss 127.833


Epoch 405: 272batch [00:23, 11.68batch/s, loss=1.37e+3]


epoch 405: avg train loss 1392.19, bar train loss 2.270, len train loss 0.025, col train loss 124.706
epoch 405: avg test  loss 1422.69, bar  test loss 2.407, len  test loss 0.028, col  test loss 127.396


Epoch 406: 272batch [00:24, 11.15batch/s, loss=1.34e+3]


epoch 406: avg train loss 1391.09, bar train loss 2.263, len train loss 0.025, col train loss 124.601


Epoch 407: 2batch [00:00, 12.19batch/s, loss=1.37e+3]

epoch 406: avg test  loss 1425.23, bar  test loss 2.423, len  test loss 0.032, col  test loss 127.836


Epoch 407: 272batch [00:23, 11.63batch/s, loss=1.38e+3]


epoch 407: avg train loss 1392.00, bar train loss 2.265, len train loss 0.025, col train loss 124.681


Epoch 408: 2batch [00:00, 12.12batch/s, loss=1.38e+3]

epoch 407: avg test  loss 1423.58, bar  test loss 2.472, len  test loss 0.029, col  test loss 127.866


Epoch 408: 272batch [00:23, 11.64batch/s, loss=1.46e+3]


epoch 408: avg train loss 1391.88, bar train loss 2.267, len train loss 0.026, col train loss 124.644


Epoch 409: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 408: avg test  loss 1423.68, bar  test loss 2.370, len  test loss 0.028, col  test loss 127.646


Epoch 409: 272batch [00:23, 11.59batch/s, loss=1.37e+3]


epoch 409: avg train loss 1391.78, bar train loss 2.250, len train loss 0.025, col train loss 124.657


Epoch 410: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 409: avg test  loss 1426.44, bar  test loss 2.479, len  test loss 0.032, col  test loss 127.827


Epoch 410: 272batch [00:23, 11.61batch/s, loss=1.52e+3]


epoch 410: avg train loss 1391.32, bar train loss 2.269, len train loss 0.025, col train loss 124.624
epoch 410: avg test  loss 1428.77, bar  test loss 2.447, len  test loss 0.027, col  test loss 127.912


Epoch 411: 272batch [00:24, 11.07batch/s, loss=1.39e+3]


epoch 411: avg train loss 1391.18, bar train loss 2.264, len train loss 0.025, col train loss 124.600


Epoch 412: 2batch [00:00, 12.35batch/s, loss=1.39e+3]

epoch 411: avg test  loss 1422.47, bar  test loss 2.453, len  test loss 0.029, col  test loss 127.659


Epoch 412: 272batch [00:23, 11.48batch/s, loss=1.41e+3]


epoch 412: avg train loss 1391.09, bar train loss 2.271, len train loss 0.025, col train loss 124.553


Epoch 413: 0batch [00:00, ?batch/s, loss=1.4e+3] 

epoch 412: avg test  loss 1424.29, bar  test loss 2.449, len  test loss 0.028, col  test loss 127.437


Epoch 413: 272batch [00:23, 11.54batch/s, loss=1.39e+3]


epoch 413: avg train loss 1390.80, bar train loss 2.261, len train loss 0.025, col train loss 124.538


Epoch 414: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 413: avg test  loss 1423.22, bar  test loss 2.462, len  test loss 0.029, col  test loss 127.575


Epoch 414: 272batch [00:23, 11.56batch/s, loss=1.51e+3]


epoch 414: avg train loss 1390.78, bar train loss 2.259, len train loss 0.025, col train loss 124.526


Epoch 415: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 414: avg test  loss 1422.89, bar  test loss 2.443, len  test loss 0.028, col  test loss 127.904


Epoch 415: 272batch [00:23, 11.49batch/s, loss=1.42e+3]


epoch 415: avg train loss 1390.97, bar train loss 2.257, len train loss 0.025, col train loss 124.557
epoch 415: avg test  loss 1424.08, bar  test loss 2.418, len  test loss 0.029, col  test loss 127.569


Epoch 416: 272batch [00:24, 11.05batch/s, loss=1.46e+3]


epoch 416: avg train loss 1391.00, bar train loss 2.266, len train loss 0.025, col train loss 124.533


Epoch 417: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 416: avg test  loss 1422.11, bar  test loss 2.485, len  test loss 0.029, col  test loss 127.399


Epoch 417: 272batch [00:23, 11.48batch/s, loss=1.48e+3]


epoch 417: avg train loss 1390.71, bar train loss 2.262, len train loss 0.025, col train loss 124.483


Epoch 418: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 417: avg test  loss 1423.28, bar  test loss 2.407, len  test loss 0.028, col  test loss 127.620


Epoch 418: 272batch [00:23, 11.52batch/s, loss=1.31e+3]


epoch 418: avg train loss 1390.65, bar train loss 2.266, len train loss 0.025, col train loss 124.509


Epoch 419: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 418: avg test  loss 1422.47, bar  test loss 2.455, len  test loss 0.028, col  test loss 127.131


Epoch 419: 272batch [00:23, 11.46batch/s, loss=1.46e+3]


epoch 419: avg train loss 1389.89, bar train loss 2.248, len train loss 0.025, col train loss 124.433


Epoch 420: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 419: avg test  loss 1423.31, bar  test loss 2.546, len  test loss 0.030, col  test loss 127.498


Epoch 420: 272batch [00:23, 11.51batch/s, loss=1.4e+3] 


epoch 420: avg train loss 1389.58, bar train loss 2.249, len train loss 0.025, col train loss 124.355
epoch 420: avg test  loss 1420.42, bar  test loss 2.386, len  test loss 0.029, col  test loss 127.395


Epoch 421: 272batch [00:25, 10.85batch/s, loss=1.43e+3]


epoch 421: avg train loss 1389.97, bar train loss 2.257, len train loss 0.025, col train loss 124.380


Epoch 422: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 421: avg test  loss 1421.54, bar  test loss 2.441, len  test loss 0.029, col  test loss 127.557


Epoch 422: 272batch [00:23, 11.49batch/s, loss=1.33e+3]


epoch 422: avg train loss 1389.87, bar train loss 2.251, len train loss 0.025, col train loss 124.375


Epoch 423: 2batch [00:00, 11.98batch/s, loss=1.44e+3]

epoch 422: avg test  loss 1421.23, bar  test loss 2.474, len  test loss 0.029, col  test loss 127.541


Epoch 423: 272batch [00:23, 11.45batch/s, loss=1.41e+3]


epoch 423: avg train loss 1390.17, bar train loss 2.255, len train loss 0.025, col train loss 124.392


Epoch 424: 2batch [00:00, 12.05batch/s, loss=1.38e+3]

epoch 423: avg test  loss 1422.53, bar  test loss 2.396, len  test loss 0.029, col  test loss 127.577


Epoch 424: 272batch [00:23, 11.45batch/s, loss=1.38e+3]


epoch 424: avg train loss 1389.61, bar train loss 2.251, len train loss 0.025, col train loss 124.360


Epoch 425: 2batch [00:00, 11.56batch/s, loss=1.32e+3]

epoch 424: avg test  loss 1423.23, bar  test loss 2.475, len  test loss 0.027, col  test loss 127.529


Epoch 425: 272batch [00:23, 11.39batch/s, loss=1.41e+3]


epoch 425: avg train loss 1389.52, bar train loss 2.259, len train loss 0.025, col train loss 124.335
epoch 425: avg test  loss 1421.60, bar  test loss 2.422, len  test loss 0.028, col  test loss 127.088


Epoch 426: 272batch [00:25, 10.82batch/s, loss=1.37e+3]


epoch 426: avg train loss 1389.63, bar train loss 2.262, len train loss 0.025, col train loss 124.326


Epoch 427: 0batch [00:00, ?batch/s]

epoch 426: avg test  loss 1423.18, bar  test loss 2.474, len  test loss 0.029, col  test loss 127.408


Epoch 427: 272batch [00:24, 11.17batch/s, loss=1.41e+3]


epoch 427: avg train loss 1389.55, bar train loss 2.264, len train loss 0.025, col train loss 124.333


Epoch 428: 2batch [00:00, 11.76batch/s, loss=1.39e+3]

epoch 427: avg test  loss 1422.26, bar  test loss 2.501, len  test loss 0.028, col  test loss 127.878


Epoch 428: 272batch [00:23, 11.42batch/s, loss=1.5e+3] 


epoch 428: avg train loss 1389.24, bar train loss 2.264, len train loss 0.025, col train loss 124.309


Epoch 429: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 428: avg test  loss 1423.41, bar  test loss 2.494, len  test loss 0.032, col  test loss 127.577


Epoch 429: 272batch [00:23, 11.39batch/s, loss=1.57e+3]


epoch 429: avg train loss 1389.15, bar train loss 2.261, len train loss 0.025, col train loss 124.289


Epoch 430: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 429: avg test  loss 1421.75, bar  test loss 2.442, len  test loss 0.030, col  test loss 127.193


Epoch 430: 272batch [00:23, 11.41batch/s, loss=1.37e+3]


epoch 430: avg train loss 1389.11, bar train loss 2.265, len train loss 0.025, col train loss 124.251
epoch 430: avg test  loss 1421.14, bar  test loss 2.465, len  test loss 0.030, col  test loss 127.270


Epoch 431: 272batch [00:25, 10.82batch/s, loss=1.35e+3]


epoch 431: avg train loss 1388.81, bar train loss 2.257, len train loss 0.025, col train loss 124.273


Epoch 432: 2batch [00:00, 12.12batch/s, loss=1.3e+3]

epoch 431: avg test  loss 1423.04, bar  test loss 2.470, len  test loss 0.038, col  test loss 127.467


Epoch 432: 272batch [00:23, 11.38batch/s, loss=1.37e+3]


epoch 432: avg train loss 1389.07, bar train loss 2.257, len train loss 0.025, col train loss 124.266


Epoch 433: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 432: avg test  loss 1423.63, bar  test loss 2.437, len  test loss 0.029, col  test loss 127.356


Epoch 433: 272batch [00:23, 11.36batch/s, loss=1.33e+3]


epoch 433: avg train loss 1388.83, bar train loss 2.253, len train loss 0.025, col train loss 124.235


Epoch 434: 0batch [00:00, ?batch/s, loss=1.4e+3] 

epoch 433: avg test  loss 1422.30, bar  test loss 2.441, len  test loss 0.033, col  test loss 127.347


Epoch 434: 272batch [00:24, 11.28batch/s, loss=1.29e+3]


epoch 434: avg train loss 1388.59, bar train loss 2.255, len train loss 0.025, col train loss 124.210


Epoch 435: 2batch [00:00, 11.90batch/s, loss=1.36e+3]

epoch 434: avg test  loss 1421.49, bar  test loss 2.450, len  test loss 0.030, col  test loss 127.591


Epoch 435: 272batch [00:23, 11.36batch/s, loss=1.41e+3]


epoch 435: avg train loss 1388.68, bar train loss 2.252, len train loss 0.025, col train loss 124.223
epoch 435: avg test  loss 1422.83, bar  test loss 2.450, len  test loss 0.032, col  test loss 127.227


Epoch 436: 272batch [00:25, 10.73batch/s, loss=1.43e+3]


epoch 436: avg train loss 1388.27, bar train loss 2.252, len train loss 0.025, col train loss 124.151


Epoch 437: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 436: avg test  loss 1420.34, bar  test loss 2.438, len  test loss 0.028, col  test loss 127.159


Epoch 437: 272batch [00:24, 11.31batch/s, loss=1.43e+3]


epoch 437: avg train loss 1388.10, bar train loss 2.249, len train loss 0.025, col train loss 124.147


Epoch 438: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 437: avg test  loss 1420.39, bar  test loss 2.463, len  test loss 0.029, col  test loss 127.225


Epoch 438: 272batch [00:24, 11.33batch/s, loss=1.38e+3]


epoch 438: avg train loss 1388.44, bar train loss 2.261, len train loss 0.025, col train loss 124.156


Epoch 439: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 438: avg test  loss 1420.82, bar  test loss 2.470, len  test loss 0.031, col  test loss 127.299


Epoch 439: 272batch [00:24, 11.29batch/s, loss=1.37e+3]


epoch 439: avg train loss 1388.09, bar train loss 2.244, len train loss 0.025, col train loss 124.092


Epoch 440: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 439: avg test  loss 1422.53, bar  test loss 2.492, len  test loss 0.030, col  test loss 127.511


Epoch 440: 272batch [00:24, 11.33batch/s, loss=1.42e+3]


epoch 440: avg train loss 1388.11, bar train loss 2.259, len train loss 0.025, col train loss 124.118
epoch 440: avg test  loss 1421.89, bar  test loss 2.435, len  test loss 0.028, col  test loss 127.328


Epoch 441: 272batch [00:25, 10.63batch/s, loss=1.49e+3]


epoch 441: avg train loss 1388.03, bar train loss 2.256, len train loss 0.025, col train loss 124.075


Epoch 442: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 441: avg test  loss 1420.10, bar  test loss 2.487, len  test loss 0.028, col  test loss 127.131


Epoch 442: 272batch [00:24, 11.29batch/s, loss=1.42e+3]


epoch 442: avg train loss 1388.11, bar train loss 2.263, len train loss 0.025, col train loss 124.132


Epoch 443: 1batch [00:00,  9.90batch/s, loss=1.36e+3]

epoch 442: avg test  loss 1420.99, bar  test loss 2.449, len  test loss 0.028, col  test loss 127.253


Epoch 443: 272batch [00:24, 11.22batch/s, loss=1.35e+3]


epoch 443: avg train loss 1387.50, bar train loss 2.255, len train loss 0.025, col train loss 124.039


Epoch 444: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 443: avg test  loss 1420.68, bar  test loss 2.520, len  test loss 0.028, col  test loss 127.372


Epoch 444: 272batch [00:24, 11.14batch/s, loss=1.26e+3]


epoch 444: avg train loss 1387.79, bar train loss 2.250, len train loss 0.025, col train loss 124.090


Epoch 445: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 444: avg test  loss 1419.72, bar  test loss 2.457, len  test loss 0.029, col  test loss 127.037


Epoch 445: 272batch [00:24, 11.27batch/s, loss=1.42e+3]


epoch 445: avg train loss 1388.01, bar train loss 2.257, len train loss 0.025, col train loss 124.063
epoch 445: avg test  loss 1421.56, bar  test loss 2.538, len  test loss 0.029, col  test loss 127.439


Epoch 446: 272batch [00:25, 10.58batch/s, loss=1.45e+3]


epoch 446: avg train loss 1387.48, bar train loss 2.260, len train loss 0.025, col train loss 124.013


Epoch 447: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 446: avg test  loss 1423.43, bar  test loss 2.480, len  test loss 0.029, col  test loss 127.522


Epoch 447: 272batch [00:24, 11.21batch/s, loss=1.35e+3]


epoch 447: avg train loss 1387.60, bar train loss 2.252, len train loss 0.025, col train loss 124.035


Epoch 448: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 447: avg test  loss 1420.53, bar  test loss 2.377, len  test loss 0.029, col  test loss 126.912


Epoch 448: 272batch [00:24, 11.23batch/s, loss=1.43e+3]


epoch 448: avg train loss 1387.41, bar train loss 2.247, len train loss 0.025, col train loss 124.031


Epoch 449: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 448: avg test  loss 1419.12, bar  test loss 2.410, len  test loss 0.034, col  test loss 127.154


Epoch 449: 272batch [00:24, 11.21batch/s, loss=1.38e+3]


epoch 449: avg train loss 1387.02, bar train loss 2.239, len train loss 0.025, col train loss 124.000


Epoch 450: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 449: avg test  loss 1421.67, bar  test loss 2.494, len  test loss 0.028, col  test loss 127.238


Epoch 450: 272batch [00:24, 11.05batch/s, loss=1.51e+3]


epoch 450: avg train loss 1387.33, bar train loss 2.248, len train loss 0.025, col train loss 123.977
epoch 450: avg test  loss 1420.61, bar  test loss 2.463, len  test loss 0.031, col  test loss 127.168


Epoch 451: 272batch [00:25, 10.47batch/s, loss=1.42e+3]


epoch 451: avg train loss 1387.46, bar train loss 2.239, len train loss 0.025, col train loss 123.982


Epoch 452: 0batch [00:00, ?batch/s, loss=1.31e+3]

epoch 451: avg test  loss 1420.57, bar  test loss 2.416, len  test loss 0.027, col  test loss 127.134


Epoch 452: 272batch [00:24, 11.20batch/s, loss=1.5e+3] 


epoch 452: avg train loss 1386.71, bar train loss 2.250, len train loss 0.025, col train loss 123.932


Epoch 453: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 452: avg test  loss 1419.81, bar  test loss 2.549, len  test loss 0.030, col  test loss 127.201


Epoch 453: 272batch [00:24, 11.17batch/s, loss=1.26e+3]


epoch 453: avg train loss 1387.35, bar train loss 2.258, len train loss 0.025, col train loss 123.988


Epoch 454: 2batch [00:00, 11.90batch/s, loss=1.35e+3]

epoch 453: avg test  loss 1422.07, bar  test loss 2.516, len  test loss 0.029, col  test loss 127.275


Epoch 454: 272batch [00:24, 11.07batch/s, loss=1.41e+3]


epoch 454: avg train loss 1387.60, bar train loss 2.256, len train loss 0.025, col train loss 123.983


Epoch 455: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 454: avg test  loss 1419.95, bar  test loss 2.413, len  test loss 0.029, col  test loss 126.950


Epoch 455: 272batch [00:24, 11.16batch/s, loss=1.41e+3]


epoch 455: avg train loss 1386.80, bar train loss 2.253, len train loss 0.025, col train loss 123.925
epoch 455: avg test  loss 1418.78, bar  test loss 2.463, len  test loss 0.029, col  test loss 127.216


Epoch 456: 272batch [00:26, 10.45batch/s, loss=1.49e+3]


epoch 456: avg train loss 1386.88, bar train loss 2.245, len train loss 0.025, col train loss 123.941


Epoch 457: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 456: avg test  loss 1420.69, bar  test loss 2.438, len  test loss 0.031, col  test loss 127.402


Epoch 457: 272batch [00:24, 11.13batch/s, loss=1.33e+3]


epoch 457: avg train loss 1387.47, bar train loss 2.252, len train loss 0.025, col train loss 123.978


Epoch 458: 2batch [00:00, 11.98batch/s, loss=1.35e+3]

epoch 457: avg test  loss 1419.75, bar  test loss 2.489, len  test loss 0.029, col  test loss 126.766


Epoch 458: 272batch [00:24, 11.18batch/s, loss=1.46e+3]


epoch 458: avg train loss 1386.50, bar train loss 2.254, len train loss 0.025, col train loss 123.892


Epoch 459: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 458: avg test  loss 1421.18, bar  test loss 2.512, len  test loss 0.029, col  test loss 127.132


Epoch 459: 272batch [00:24, 11.10batch/s, loss=1.54e+3]


epoch 459: avg train loss 1386.60, bar train loss 2.250, len train loss 0.025, col train loss 123.886


Epoch 460: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 459: avg test  loss 1419.82, bar  test loss 2.552, len  test loss 0.030, col  test loss 127.104


Epoch 460: 272batch [00:24, 11.09batch/s, loss=1.35e+3]


epoch 460: avg train loss 1386.64, bar train loss 2.250, len train loss 0.025, col train loss 123.886
epoch 460: avg test  loss 1418.50, bar  test loss 2.376, len  test loss 0.028, col  test loss 127.323


Epoch 461: 272batch [00:26, 10.29batch/s, loss=1.54e+3]


epoch 461: avg train loss 1386.95, bar train loss 2.249, len train loss 0.025, col train loss 123.931


Epoch 462: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 461: avg test  loss 1419.27, bar  test loss 2.520, len  test loss 0.028, col  test loss 127.197


Epoch 462: 272batch [00:24, 11.10batch/s, loss=1.26e+3]


epoch 462: avg train loss 1387.68, bar train loss 2.258, len train loss 0.025, col train loss 123.988


Epoch 463: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 462: avg test  loss 1422.47, bar  test loss 2.706, len  test loss 0.029, col  test loss 126.948


Epoch 463: 272batch [00:24, 11.05batch/s, loss=1.31e+3]


epoch 463: avg train loss 1386.73, bar train loss 2.255, len train loss 0.025, col train loss 123.905


Epoch 464: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 463: avg test  loss 1420.74, bar  test loss 2.451, len  test loss 0.028, col  test loss 127.358


Epoch 464: 272batch [00:24, 11.08batch/s, loss=1.25e+3]


epoch 464: avg train loss 1387.05, bar train loss 2.251, len train loss 0.025, col train loss 123.922


Epoch 465: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 464: avg test  loss 1419.82, bar  test loss 2.446, len  test loss 0.029, col  test loss 126.996


Epoch 465: 272batch [00:24, 11.01batch/s, loss=1.45e+3]


epoch 465: avg train loss 1386.49, bar train loss 2.253, len train loss 0.025, col train loss 123.862
epoch 465: avg test  loss 1421.35, bar  test loss 2.443, len  test loss 0.029, col  test loss 127.207


Epoch 466: 272batch [00:25, 10.51batch/s, loss=1.33e+3]


epoch 466: avg train loss 1386.68, bar train loss 2.248, len train loss 0.025, col train loss 123.897


Epoch 467: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 466: avg test  loss 1418.80, bar  test loss 2.426, len  test loss 0.027, col  test loss 126.630


Epoch 467: 272batch [00:24, 11.10batch/s, loss=1.37e+3]


epoch 467: avg train loss 1386.94, bar train loss 2.252, len train loss 0.025, col train loss 123.883


Epoch 468: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 467: avg test  loss 1418.97, bar  test loss 2.462, len  test loss 0.028, col  test loss 126.759


Epoch 468: 272batch [00:24, 11.01batch/s, loss=1.32e+3]


epoch 468: avg train loss 1386.50, bar train loss 2.253, len train loss 0.025, col train loss 123.836


Epoch 469: 0batch [00:00, ?batch/s]

epoch 468: avg test  loss 1418.58, bar  test loss 2.443, len  test loss 0.030, col  test loss 126.930


Epoch 469: 272batch [00:24, 11.03batch/s, loss=1.23e+3]


epoch 469: avg train loss 1386.43, bar train loss 2.244, len train loss 0.025, col train loss 123.835


Epoch 470: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 469: avg test  loss 1419.99, bar  test loss 2.439, len  test loss 0.028, col  test loss 126.854


Epoch 470: 272batch [00:24, 11.05batch/s, loss=1.33e+3]


epoch 470: avg train loss 1386.33, bar train loss 2.249, len train loss 0.025, col train loss 123.854
epoch 470: avg test  loss 1418.98, bar  test loss 2.440, len  test loss 0.029, col  test loss 127.274


Epoch 471: 272batch [00:26, 10.35batch/s, loss=1.41e+3]


epoch 471: avg train loss 1386.05, bar train loss 2.241, len train loss 0.025, col train loss 123.805


Epoch 472: 0batch [00:00, ?batch/s, loss=1.33e+3]

epoch 471: avg test  loss 1418.72, bar  test loss 2.422, len  test loss 0.028, col  test loss 127.068


Epoch 472: 272batch [00:24, 11.03batch/s, loss=1.33e+3]


epoch 472: avg train loss 1386.87, bar train loss 2.254, len train loss 0.025, col train loss 123.844


Epoch 473: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 472: avg test  loss 1419.41, bar  test loss 2.458, len  test loss 0.029, col  test loss 126.945


Epoch 473: 272batch [00:24, 10.97batch/s, loss=1.46e+3]


epoch 473: avg train loss 1386.63, bar train loss 2.253, len train loss 0.025, col train loss 123.841


Epoch 474: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 473: avg test  loss 1418.46, bar  test loss 2.531, len  test loss 0.029, col  test loss 126.884


Epoch 474: 272batch [00:24, 10.99batch/s, loss=1.36e+3]


epoch 474: avg train loss 1386.06, bar train loss 2.257, len train loss 0.025, col train loss 123.785


Epoch 475: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 474: avg test  loss 1419.77, bar  test loss 2.524, len  test loss 0.028, col  test loss 127.003


Epoch 475: 272batch [00:24, 10.89batch/s, loss=1.36e+3]


epoch 475: avg train loss 1386.61, bar train loss 2.247, len train loss 0.025, col train loss 123.872
epoch 475: avg test  loss 1420.53, bar  test loss 2.521, len  test loss 0.029, col  test loss 127.052


Epoch 476: 272batch [00:26, 10.17batch/s, loss=1.56e+3]


epoch 476: avg train loss 1386.28, bar train loss 2.244, len train loss 0.025, col train loss 123.796


Epoch 477: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 476: avg test  loss 1419.24, bar  test loss 2.447, len  test loss 0.029, col  test loss 127.279


Epoch 477: 272batch [00:24, 10.95batch/s, loss=1.31e+3]


epoch 477: avg train loss 1386.40, bar train loss 2.257, len train loss 0.025, col train loss 123.809


Epoch 478: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 477: avg test  loss 1419.50, bar  test loss 2.445, len  test loss 0.030, col  test loss 126.939


Epoch 478: 272batch [00:24, 10.90batch/s, loss=1.27e+3]


epoch 478: avg train loss 1386.04, bar train loss 2.249, len train loss 0.025, col train loss 123.746


Epoch 479: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 478: avg test  loss 1419.97, bar  test loss 2.383, len  test loss 0.029, col  test loss 126.704


Epoch 479: 272batch [00:24, 10.93batch/s, loss=1.4e+3] 


epoch 479: avg train loss 1386.72, bar train loss 2.253, len train loss 0.025, col train loss 123.825


Epoch 480: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 479: avg test  loss 1419.79, bar  test loss 2.428, len  test loss 0.027, col  test loss 126.883


Epoch 480: 272batch [00:24, 10.89batch/s, loss=1.37e+3]


epoch 480: avg train loss 1387.00, bar train loss 2.260, len train loss 0.025, col train loss 123.868
epoch 480: avg test  loss 1420.05, bar  test loss 2.519, len  test loss 0.031, col  test loss 127.100


Epoch 481: 272batch [00:26, 10.13batch/s, loss=1.43e+3]


epoch 481: avg train loss 1386.33, bar train loss 2.260, len train loss 0.025, col train loss 123.814


Epoch 482: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 481: avg test  loss 1417.20, bar  test loss 2.458, len  test loss 0.031, col  test loss 126.692


Epoch 482: 272batch [00:24, 10.94batch/s, loss=1.37e+3]


epoch 482: avg train loss 1386.33, bar train loss 2.248, len train loss 0.024, col train loss 123.778


Epoch 483: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 482: avg test  loss 1419.74, bar  test loss 2.494, len  test loss 0.029, col  test loss 126.951


Epoch 483: 272batch [00:24, 10.90batch/s, loss=1.36e+3]


epoch 483: avg train loss 1385.69, bar train loss 2.253, len train loss 0.025, col train loss 123.742


Epoch 484: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 483: avg test  loss 1417.81, bar  test loss 2.438, len  test loss 0.027, col  test loss 126.638


Epoch 484: 272batch [00:25, 10.86batch/s, loss=1.49e+3]


epoch 484: avg train loss 1386.87, bar train loss 2.248, len train loss 0.025, col train loss 123.822


Epoch 485: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 484: avg test  loss 1418.34, bar  test loss 2.455, len  test loss 0.029, col  test loss 126.831


Epoch 485: 272batch [00:25, 10.88batch/s, loss=1.5e+3] 


epoch 485: avg train loss 1386.52, bar train loss 2.260, len train loss 0.025, col train loss 123.801
epoch 485: avg test  loss 1419.12, bar  test loss 2.508, len  test loss 0.033, col  test loss 127.200


Epoch 486: 272batch [00:26, 10.21batch/s, loss=1.44e+3]


epoch 486: avg train loss 1386.96, bar train loss 2.264, len train loss 0.026, col train loss 123.809


Epoch 487: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 486: avg test  loss 1421.41, bar  test loss 2.454, len  test loss 0.030, col  test loss 126.815


Epoch 487: 272batch [00:25, 10.86batch/s, loss=1.47e+3]


epoch 487: avg train loss 1386.44, bar train loss 2.243, len train loss 0.025, col train loss 123.751


Epoch 488: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 487: avg test  loss 1419.41, bar  test loss 2.466, len  test loss 0.027, col  test loss 126.824


Epoch 488: 272batch [00:24, 10.88batch/s, loss=1.32e+3]


epoch 488: avg train loss 1386.56, bar train loss 2.264, len train loss 0.025, col train loss 123.805


Epoch 489: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 488: avg test  loss 1421.91, bar  test loss 2.490, len  test loss 0.030, col  test loss 127.616


Epoch 489: 272batch [00:25, 10.87batch/s, loss=1.56e+3]


epoch 489: avg train loss 1386.23, bar train loss 2.250, len train loss 0.025, col train loss 123.759


Epoch 490: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 489: avg test  loss 1420.02, bar  test loss 2.446, len  test loss 0.030, col  test loss 126.936


Epoch 490: 272batch [00:25, 10.85batch/s, loss=1.32e+3]


epoch 490: avg train loss 1386.70, bar train loss 2.244, len train loss 0.024, col train loss 123.765
epoch 490: avg test  loss 1419.58, bar  test loss 2.515, len  test loss 0.029, col  test loss 127.110


Epoch 491: 272batch [00:27,  9.80batch/s, loss=1.46e+3]


epoch 491: avg train loss 1386.77, bar train loss 2.253, len train loss 0.025, col train loss 123.820


Epoch 492: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 491: avg test  loss 1420.06, bar  test loss 2.578, len  test loss 0.028, col  test loss 126.661


Epoch 492: 272batch [00:25, 10.83batch/s, loss=1.37e+3]


epoch 492: avg train loss 1386.48, bar train loss 2.257, len train loss 0.025, col train loss 123.771


Epoch 493: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 492: avg test  loss 1421.73, bar  test loss 2.477, len  test loss 0.028, col  test loss 127.250


Epoch 493: 272batch [00:25, 10.83batch/s, loss=1.48e+3]


epoch 493: avg train loss 1386.53, bar train loss 2.261, len train loss 0.025, col train loss 123.758


Epoch 494: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 493: avg test  loss 1419.28, bar  test loss 2.462, len  test loss 0.028, col  test loss 126.701


Epoch 494: 272batch [00:25, 10.75batch/s, loss=1.33e+3]


epoch 494: avg train loss 1386.49, bar train loss 2.262, len train loss 0.025, col train loss 123.729


Epoch 495: 1batch [00:00, 10.00batch/s, loss=1.39e+3]

epoch 494: avg test  loss 1421.03, bar  test loss 2.522, len  test loss 0.029, col  test loss 126.942


Epoch 495: 272batch [00:25, 10.80batch/s, loss=1.31e+3]


epoch 495: avg train loss 1386.52, bar train loss 2.262, len train loss 0.026, col train loss 123.761
epoch 495: avg test  loss 1418.36, bar  test loss 2.463, len  test loss 0.029, col  test loss 126.729


Epoch 496: 272batch [00:27,  9.93batch/s, loss=1.3e+3] 


epoch 496: avg train loss 1386.87, bar train loss 2.265, len train loss 0.025, col train loss 123.791


Epoch 497: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 496: avg test  loss 1419.54, bar  test loss 2.452, len  test loss 0.031, col  test loss 126.970


Epoch 497: 272batch [00:25, 10.68batch/s, loss=1.48e+3]


epoch 497: avg train loss 1386.48, bar train loss 2.258, len train loss 0.025, col train loss 123.749


Epoch 498: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 497: avg test  loss 1423.59, bar  test loss 2.570, len  test loss 0.030, col  test loss 127.361


Epoch 498: 272batch [00:25, 10.77batch/s, loss=1.36e+3]


epoch 498: avg train loss 1387.55, bar train loss 2.259, len train loss 0.025, col train loss 123.805


Epoch 499: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 498: avg test  loss 1421.13, bar  test loss 2.485, len  test loss 0.030, col  test loss 127.087


Epoch 499: 272batch [00:25, 10.79batch/s, loss=1.27e+3]


epoch 499: avg train loss 1387.12, bar train loss 2.264, len train loss 0.025, col train loss 123.742


Epoch 500: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 499: avg test  loss 1424.14, bar  test loss 2.554, len  test loss 0.029, col  test loss 127.000


Epoch 500: 272batch [00:25, 10.72batch/s, loss=1.27e+3]


epoch 500: avg train loss 1387.30, bar train loss 2.270, len train loss 0.025, col train loss 123.830
epoch 500: avg test  loss 1421.55, bar  test loss 2.448, len  test loss 0.028, col  test loss 127.118


Epoch 501: 272batch [00:28,  9.58batch/s, loss=1.45e+3]


epoch 501: avg train loss 1387.07, bar train loss 2.262, len train loss 0.025, col train loss 123.827


Epoch 502: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 501: avg test  loss 1421.33, bar  test loss 2.402, len  test loss 0.028, col  test loss 126.778


Epoch 502: 272batch [00:25, 10.68batch/s, loss=1.36e+3]


epoch 502: avg train loss 1386.83, bar train loss 2.262, len train loss 0.025, col train loss 123.764


Epoch 503: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 502: avg test  loss 1421.39, bar  test loss 2.524, len  test loss 0.028, col  test loss 126.504


Epoch 503: 272batch [00:25, 10.68batch/s, loss=1.34e+3]


epoch 503: avg train loss 1386.91, bar train loss 2.259, len train loss 0.025, col train loss 123.770


Epoch 504: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 503: avg test  loss 1420.76, bar  test loss 2.462, len  test loss 0.030, col  test loss 126.866


Epoch 504: 272batch [00:25, 10.53batch/s, loss=1.44e+3]


epoch 504: avg train loss 1387.46, bar train loss 2.271, len train loss 0.025, col train loss 123.848


Epoch 505: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 504: avg test  loss 1423.71, bar  test loss 2.504, len  test loss 0.030, col  test loss 127.054


Epoch 505: 272batch [00:25, 10.68batch/s, loss=1.32e+3]


epoch 505: avg train loss 1386.90, bar train loss 2.255, len train loss 0.025, col train loss 123.743
epoch 505: avg test  loss 1420.69, bar  test loss 2.506, len  test loss 0.027, col  test loss 126.881


Epoch 506: 272batch [00:27,  9.81batch/s, loss=1.34e+3]


epoch 506: avg train loss 1387.09, bar train loss 2.268, len train loss 0.025, col train loss 123.755


Epoch 507: 1batch [00:00, 10.00batch/s, loss=1.3e+3]

epoch 506: avg test  loss 1420.29, bar  test loss 2.405, len  test loss 0.028, col  test loss 126.785


Epoch 507: 272batch [00:25, 10.70batch/s, loss=1.48e+3]


epoch 507: avg train loss 1387.38, bar train loss 2.269, len train loss 0.026, col train loss 123.811


Epoch 508: 1batch [00:00,  9.71batch/s, loss=1.38e+3]

epoch 507: avg test  loss 1420.18, bar  test loss 2.502, len  test loss 0.028, col  test loss 126.772


Epoch 508: 272batch [00:25, 10.76batch/s, loss=1.43e+3]


epoch 508: avg train loss 1387.42, bar train loss 2.269, len train loss 0.025, col train loss 123.794


Epoch 509: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 508: avg test  loss 1418.62, bar  test loss 2.409, len  test loss 0.028, col  test loss 126.529


Epoch 509: 272batch [00:25, 10.69batch/s, loss=1.4e+3] 


epoch 509: avg train loss 1387.45, bar train loss 2.256, len train loss 0.025, col train loss 123.768


Epoch 510: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 509: avg test  loss 1420.89, bar  test loss 2.487, len  test loss 0.031, col  test loss 126.601


Epoch 510: 272batch [00:25, 10.69batch/s, loss=1.38e+3]


epoch 510: avg train loss 1387.76, bar train loss 2.273, len train loss 0.026, col train loss 123.839
epoch 510: avg test  loss 1419.22, bar  test loss 2.424, len  test loss 0.031, col  test loss 126.788


Epoch 511: 272batch [00:28,  9.69batch/s, loss=1.29e+3]


epoch 511: avg train loss 1387.92, bar train loss 2.263, len train loss 0.025, col train loss 123.832


Epoch 512: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 511: avg test  loss 1420.32, bar  test loss 2.501, len  test loss 0.030, col  test loss 126.776


Epoch 512: 272batch [00:25, 10.65batch/s, loss=1.47e+3]


epoch 512: avg train loss 1387.44, bar train loss 2.269, len train loss 0.025, col train loss 123.787


Epoch 513: 1batch [00:00,  9.80batch/s, loss=1.4e+3]

epoch 512: avg test  loss 1422.28, bar  test loss 2.541, len  test loss 0.030, col  test loss 127.008


Epoch 513: 272batch [00:25, 10.61batch/s, loss=1.34e+3]


epoch 513: avg train loss 1388.03, bar train loss 2.268, len train loss 0.025, col train loss 123.844


Epoch 514: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 513: avg test  loss 1418.95, bar  test loss 2.469, len  test loss 0.028, col  test loss 127.120


Epoch 514: 272batch [00:25, 10.67batch/s, loss=1.37e+3]


epoch 514: avg train loss 1388.08, bar train loss 2.271, len train loss 0.025, col train loss 123.859


Epoch 515: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 514: avg test  loss 1421.02, bar  test loss 2.441, len  test loss 0.031, col  test loss 127.196


Epoch 515: 272batch [00:25, 10.64batch/s, loss=1.42e+3]


epoch 515: avg train loss 1388.54, bar train loss 2.265, len train loss 0.025, col train loss 123.886
epoch 515: avg test  loss 1424.02, bar  test loss 2.561, len  test loss 0.029, col  test loss 127.220


Epoch 516: 272batch [00:28,  9.43batch/s, loss=1.36e+3]


epoch 516: avg train loss 1387.87, bar train loss 2.270, len train loss 0.025, col train loss 123.797


Epoch 517: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 516: avg test  loss 1422.56, bar  test loss 2.507, len  test loss 0.028, col  test loss 127.201


Epoch 517: 272batch [00:25, 10.60batch/s, loss=1.39e+3]


epoch 517: avg train loss 1388.20, bar train loss 2.263, len train loss 0.025, col train loss 123.864


Epoch 518: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 517: avg test  loss 1420.66, bar  test loss 2.548, len  test loss 0.029, col  test loss 126.974


Epoch 518: 272batch [00:25, 10.66batch/s, loss=1.45e+3]


epoch 518: avg train loss 1388.31, bar train loss 2.276, len train loss 0.025, col train loss 123.849


Epoch 519: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 518: avg test  loss 1423.54, bar  test loss 2.535, len  test loss 0.034, col  test loss 127.184


Epoch 519: 272batch [00:25, 10.57batch/s, loss=1.45e+3]


epoch 519: avg train loss 1388.86, bar train loss 2.273, len train loss 0.025, col train loss 123.874


Epoch 520: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 519: avg test  loss 1421.67, bar  test loss 2.535, len  test loss 0.029, col  test loss 127.017


Epoch 520: 272batch [00:25, 10.57batch/s, loss=1.36e+3]


epoch 520: avg train loss 1388.09, bar train loss 2.271, len train loss 0.025, col train loss 123.842
epoch 520: avg test  loss 1419.81, bar  test loss 2.500, len  test loss 0.028, col  test loss 127.168


Epoch 521: 272batch [00:28,  9.41batch/s, loss=1.33e+3]


epoch 521: avg train loss 1388.29, bar train loss 2.272, len train loss 0.025, col train loss 123.801


Epoch 522: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 521: avg test  loss 1421.49, bar  test loss 2.463, len  test loss 0.029, col  test loss 127.102


Epoch 522: 272batch [00:26, 10.19batch/s, loss=1.39e+3]


epoch 522: avg train loss 1389.10, bar train loss 2.271, len train loss 0.025, col train loss 123.909


Epoch 523: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 522: avg test  loss 1421.99, bar  test loss 2.499, len  test loss 0.030, col  test loss 127.050


Epoch 523: 272batch [00:25, 10.59batch/s, loss=1.37e+3]


epoch 523: avg train loss 1388.88, bar train loss 2.282, len train loss 0.025, col train loss 123.911


Epoch 524: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 523: avg test  loss 1420.58, bar  test loss 2.439, len  test loss 0.029, col  test loss 127.361


Epoch 524: 272batch [00:24, 10.92batch/s, loss=1.53e+3]


epoch 524: avg train loss 1389.07, bar train loss 2.268, len train loss 0.025, col train loss 123.885


Epoch 525: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 524: avg test  loss 1421.86, bar  test loss 2.513, len  test loss 0.030, col  test loss 127.485


Epoch 525: 272batch [00:24, 10.93batch/s, loss=1.32e+3]


epoch 525: avg train loss 1388.56, bar train loss 2.273, len train loss 0.025, col train loss 123.870
epoch 525: avg test  loss 1425.58, bar  test loss 2.447, len  test loss 0.030, col  test loss 127.206


Epoch 526: 272batch [00:24, 10.92batch/s, loss=1.39e+3]


epoch 526: avg train loss 1388.85, bar train loss 2.277, len train loss 0.025, col train loss 123.856


Epoch 527: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 526: avg test  loss 1423.52, bar  test loss 2.436, len  test loss 0.029, col  test loss 127.017


Epoch 527: 272batch [00:24, 10.89batch/s, loss=1.42e+3]


epoch 527: avg train loss 1389.57, bar train loss 2.291, len train loss 0.026, col train loss 123.930


Epoch 528: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 527: avg test  loss 1423.75, bar  test loss 2.639, len  test loss 0.031, col  test loss 127.069


Epoch 528: 272batch [00:24, 10.90batch/s, loss=1.41e+3]


epoch 528: avg train loss 1389.70, bar train loss 2.300, len train loss 0.025, col train loss 124.020


Epoch 529: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 528: avg test  loss 1422.18, bar  test loss 2.581, len  test loss 0.028, col  test loss 126.978


Epoch 529: 272batch [00:25, 10.79batch/s, loss=1.33e+3]


epoch 529: avg train loss 1389.73, bar train loss 2.281, len train loss 0.025, col train loss 123.995


Epoch 530: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 529: avg test  loss 1422.87, bar  test loss 2.476, len  test loss 0.032, col  test loss 127.212


Epoch 530: 272batch [00:25, 10.84batch/s, loss=1.43e+3]


epoch 530: avg train loss 1388.91, bar train loss 2.272, len train loss 0.025, col train loss 123.911
epoch 530: avg test  loss 1421.91, bar  test loss 2.487, len  test loss 0.035, col  test loss 127.119


Epoch 531: 272batch [00:24, 10.89batch/s, loss=1.46e+3]


epoch 531: avg train loss 1389.74, bar train loss 2.295, len train loss 0.026, col train loss 123.978


Epoch 532: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 531: avg test  loss 1421.23, bar  test loss 2.613, len  test loss 0.030, col  test loss 127.132


Epoch 532: 272batch [00:25, 10.86batch/s, loss=1.46e+3]


epoch 532: avg train loss 1389.83, bar train loss 2.277, len train loss 0.025, col train loss 124.017


Epoch 533: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 532: avg test  loss 1423.46, bar  test loss 2.513, len  test loss 0.030, col  test loss 127.295


Epoch 533: 272batch [00:25, 10.82batch/s, loss=1.37e+3]


epoch 533: avg train loss 1389.70, bar train loss 2.278, len train loss 0.025, col train loss 124.002


Epoch 534: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 533: avg test  loss 1421.57, bar  test loss 2.406, len  test loss 0.027, col  test loss 126.956


Epoch 534: 272batch [00:25, 10.79batch/s, loss=1.45e+3]


epoch 534: avg train loss 1389.44, bar train loss 2.289, len train loss 0.025, col train loss 123.955


Epoch 535: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 534: avg test  loss 1422.66, bar  test loss 2.473, len  test loss 0.029, col  test loss 126.989


Epoch 535: 272batch [00:25, 10.66batch/s, loss=1.38e+3]


epoch 535: avg train loss 1390.30, bar train loss 2.286, len train loss 0.025, col train loss 124.019
epoch 535: avg test  loss 1427.29, bar  test loss 2.579, len  test loss 0.031, col  test loss 126.947


Epoch 536: 272batch [00:25, 10.83batch/s, loss=1.41e+3]


epoch 536: avg train loss 1391.11, bar train loss 2.294, len train loss 0.025, col train loss 124.114


Epoch 537: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 536: avg test  loss 1422.10, bar  test loss 2.511, len  test loss 0.029, col  test loss 127.011


Epoch 537: 272batch [00:24, 10.89batch/s, loss=1.46e+3]


epoch 537: avg train loss 1390.19, bar train loss 2.274, len train loss 0.025, col train loss 123.955


Epoch 538: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 537: avg test  loss 1423.39, bar  test loss 2.568, len  test loss 0.031, col  test loss 127.294


Epoch 538: 272batch [00:25, 10.79batch/s, loss=1.44e+3]


epoch 538: avg train loss 1391.51, bar train loss 2.303, len train loss 0.025, col train loss 124.142


Epoch 539: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 538: avg test  loss 1424.28, bar  test loss 2.487, len  test loss 0.028, col  test loss 127.142


Epoch 539: 272batch [00:25, 10.80batch/s, loss=1.4e+3] 


epoch 539: avg train loss 1391.13, bar train loss 2.292, len train loss 0.025, col train loss 124.069


Epoch 540: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 539: avg test  loss 1422.12, bar  test loss 2.518, len  test loss 0.028, col  test loss 127.003


Epoch 540: 272batch [00:25, 10.81batch/s, loss=1.38e+3]


epoch 540: avg train loss 1390.26, bar train loss 2.286, len train loss 0.026, col train loss 124.034
epoch 540: avg test  loss 1425.28, bar  test loss 2.654, len  test loss 0.029, col  test loss 127.041


Epoch 541: 272batch [00:25, 10.79batch/s, loss=1.36e+3]


epoch 541: avg train loss 1390.65, bar train loss 2.285, len train loss 0.025, col train loss 124.096


Epoch 542: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 541: avg test  loss 1421.51, bar  test loss 2.447, len  test loss 0.029, col  test loss 126.846


Epoch 542: 272batch [00:25, 10.82batch/s, loss=1.48e+3]


epoch 542: avg train loss 1391.58, bar train loss 2.284, len train loss 0.026, col train loss 124.110


Epoch 543: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 542: avg test  loss 1426.23, bar  test loss 2.524, len  test loss 0.029, col  test loss 127.396


Epoch 543: 272batch [00:25, 10.69batch/s, loss=1.33e+3]


epoch 543: avg train loss 1391.72, bar train loss 2.293, len train loss 0.026, col train loss 124.143


Epoch 544: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 543: avg test  loss 1423.63, bar  test loss 2.475, len  test loss 0.028, col  test loss 127.230


Epoch 544: 272batch [00:25, 10.82batch/s, loss=1.51e+3]


epoch 544: avg train loss 1392.29, bar train loss 2.318, len train loss 0.026, col train loss 124.160


Epoch 545: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 544: avg test  loss 1423.36, bar  test loss 2.492, len  test loss 0.031, col  test loss 127.237


Epoch 545: 272batch [00:25, 10.75batch/s, loss=1.46e+3]


epoch 545: avg train loss 1391.90, bar train loss 2.300, len train loss 0.026, col train loss 124.123
epoch 545: avg test  loss 1425.19, bar  test loss 2.502, len  test loss 0.029, col  test loss 127.133


Epoch 546: 272batch [00:25, 10.75batch/s, loss=1.45e+3]


epoch 546: avg train loss 1391.60, bar train loss 2.289, len train loss 0.025, col train loss 124.105


Epoch 547: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 546: avg test  loss 1423.58, bar  test loss 2.504, len  test loss 0.030, col  test loss 127.456


Epoch 547: 272batch [00:25, 10.74batch/s, loss=1.42e+3]


epoch 547: avg train loss 1392.27, bar train loss 2.322, len train loss 0.026, col train loss 124.207


Epoch 548: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 547: avg test  loss 1423.35, bar  test loss 2.467, len  test loss 0.028, col  test loss 126.926


Epoch 548: 272batch [00:25, 10.74batch/s, loss=1.43e+3]


epoch 548: avg train loss 1392.07, bar train loss 2.316, len train loss 0.025, col train loss 124.150


Epoch 549: 1batch [00:00, 10.00batch/s, loss=1.39e+3]

epoch 548: avg test  loss 1422.75, bar  test loss 2.526, len  test loss 0.030, col  test loss 127.109


Epoch 549: 272batch [00:25, 10.70batch/s, loss=1.44e+3]


epoch 549: avg train loss 1392.39, bar train loss 2.311, len train loss 0.026, col train loss 124.172


Epoch 550: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 549: avg test  loss 1424.46, bar  test loss 2.501, len  test loss 0.030, col  test loss 127.047


Epoch 550: 272batch [00:25, 10.70batch/s, loss=1.49e+3]


epoch 550: avg train loss 1392.10, bar train loss 2.299, len train loss 0.026, col train loss 124.147
epoch 550: avg test  loss 1426.14, bar  test loss 2.598, len  test loss 0.029, col  test loss 127.654


Epoch 551: 272batch [00:25, 10.68batch/s, loss=1.44e+3]


epoch 551: avg train loss 1392.65, bar train loss 2.299, len train loss 0.025, col train loss 124.230


Epoch 552: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 551: avg test  loss 1426.28, bar  test loss 2.528, len  test loss 0.029, col  test loss 127.465


Epoch 552: 272batch [00:25, 10.71batch/s, loss=1.41e+3]


epoch 552: avg train loss 1393.50, bar train loss 2.297, len train loss 0.026, col train loss 124.354


Epoch 553: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 552: avg test  loss 1423.50, bar  test loss 2.479, len  test loss 0.028, col  test loss 127.240


Epoch 553: 272batch [00:25, 10.61batch/s, loss=1.49e+3]


epoch 553: avg train loss 1392.77, bar train loss 2.314, len train loss 0.025, col train loss 124.230


Epoch 554: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 553: avg test  loss 1423.73, bar  test loss 2.477, len  test loss 0.029, col  test loss 127.078


Epoch 554: 272batch [00:25, 10.70batch/s, loss=1.34e+3]


epoch 554: avg train loss 1393.85, bar train loss 2.310, len train loss 0.025, col train loss 124.375


Epoch 555: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 554: avg test  loss 1429.48, bar  test loss 2.786, len  test loss 0.029, col  test loss 127.427


Epoch 555: 272batch [00:25, 10.65batch/s, loss=1.35e+3]


epoch 555: avg train loss 1394.03, bar train loss 2.325, len train loss 0.026, col train loss 124.311
epoch 555: avg test  loss 1423.46, bar  test loss 2.492, len  test loss 0.029, col  test loss 127.036


Epoch 556: 272batch [00:25, 10.65batch/s, loss=1.41e+3]


epoch 556: avg train loss 1394.28, bar train loss 2.317, len train loss 0.026, col train loss 124.391


Epoch 557: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 556: avg test  loss 1424.87, bar  test loss 2.624, len  test loss 0.029, col  test loss 127.516


Epoch 557: 272batch [00:25, 10.64batch/s, loss=1.31e+3]


epoch 557: avg train loss 1393.15, bar train loss 2.309, len train loss 0.026, col train loss 124.233


Epoch 558: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 557: avg test  loss 1426.00, bar  test loss 2.546, len  test loss 0.030, col  test loss 127.629


Epoch 558: 272batch [00:25, 10.61batch/s, loss=1.32e+3]


epoch 558: avg train loss 1393.58, bar train loss 2.315, len train loss 0.025, col train loss 124.318


Epoch 559: 1batch [00:00,  9.80batch/s, loss=1.36e+3]

epoch 558: avg test  loss 1425.94, bar  test loss 2.551, len  test loss 0.028, col  test loss 127.696


Epoch 559: 272batch [00:25, 10.68batch/s, loss=1.31e+3]


epoch 559: avg train loss 1394.50, bar train loss 2.312, len train loss 0.025, col train loss 124.436


Epoch 560: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 559: avg test  loss 1426.09, bar  test loss 2.488, len  test loss 0.029, col  test loss 127.583


Epoch 560: 272batch [00:25, 10.72batch/s, loss=1.4e+3] 


epoch 560: avg train loss 1394.57, bar train loss 2.331, len train loss 0.025, col train loss 124.377
epoch 560: avg test  loss 1426.77, bar  test loss 2.468, len  test loss 0.029, col  test loss 127.057


Epoch 561: 272batch [00:25, 10.62batch/s, loss=1.31e+3]


epoch 561: avg train loss 1395.58, bar train loss 2.346, len train loss 0.026, col train loss 124.527


Epoch 562: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 561: avg test  loss 1428.85, bar  test loss 2.598, len  test loss 0.028, col  test loss 127.598


Epoch 562: 272batch [00:25, 10.66batch/s, loss=1.35e+3]


epoch 562: avg train loss 1394.60, bar train loss 2.324, len train loss 0.025, col train loss 124.295


Epoch 563: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 562: avg test  loss 1425.90, bar  test loss 2.467, len  test loss 0.029, col  test loss 127.785


Epoch 563: 272batch [00:25, 10.63batch/s, loss=1.37e+3]


epoch 563: avg train loss 1394.99, bar train loss 2.326, len train loss 0.026, col train loss 124.453


Epoch 564: 1batch [00:00,  9.71batch/s, loss=1.4e+3]

epoch 563: avg test  loss 1426.85, bar  test loss 2.507, len  test loss 0.030, col  test loss 127.503


Epoch 564: 272batch [00:25, 10.59batch/s, loss=1.35e+3]


epoch 564: avg train loss 1394.81, bar train loss 2.326, len train loss 0.025, col train loss 124.446


Epoch 565: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 564: avg test  loss 1425.02, bar  test loss 2.539, len  test loss 0.030, col  test loss 126.946


Epoch 565: 272batch [00:26, 10.15batch/s, loss=1.51e+3]


epoch 565: avg train loss 1395.02, bar train loss 2.327, len train loss 0.026, col train loss 124.378
epoch 565: avg test  loss 1429.00, bar  test loss 2.498, len  test loss 0.031, col  test loss 127.285


Epoch 566: 272batch [00:25, 10.61batch/s, loss=1.32e+3]


epoch 566: avg train loss 1395.95, bar train loss 2.324, len train loss 0.025, col train loss 124.531


Epoch 567: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 566: avg test  loss 1428.23, bar  test loss 2.590, len  test loss 0.031, col  test loss 127.503


Epoch 567: 272batch [00:25, 10.59batch/s, loss=1.36e+3]


epoch 567: avg train loss 1396.42, bar train loss 2.327, len train loss 0.026, col train loss 124.557


Epoch 568: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 567: avg test  loss 1426.65, bar  test loss 2.546, len  test loss 0.029, col  test loss 127.280


Epoch 568: 272batch [00:25, 10.61batch/s, loss=1.36e+3]


epoch 568: avg train loss 1395.78, bar train loss 2.325, len train loss 0.026, col train loss 124.559


Epoch 569: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 568: avg test  loss 1427.95, bar  test loss 2.539, len  test loss 0.030, col  test loss 127.803


Epoch 569: 272batch [00:26, 10.43batch/s, loss=1.38e+3]


epoch 569: avg train loss 1396.20, bar train loss 2.342, len train loss 0.026, col train loss 124.492


Epoch 570: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 569: avg test  loss 1427.75, bar  test loss 2.504, len  test loss 0.030, col  test loss 127.498


Epoch 570: 272batch [00:25, 10.58batch/s, loss=1.47e+3]


epoch 570: avg train loss 1397.25, bar train loss 2.330, len train loss 0.026, col train loss 124.631
epoch 570: avg test  loss 1428.57, bar  test loss 2.562, len  test loss 0.031, col  test loss 127.532


Epoch 571: 272batch [00:25, 10.58batch/s, loss=1.31e+3]


epoch 571: avg train loss 1396.84, bar train loss 2.323, len train loss 0.026, col train loss 124.602


Epoch 572: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 571: avg test  loss 1429.88, bar  test loss 2.539, len  test loss 0.029, col  test loss 128.141


Epoch 572: 272batch [00:25, 10.47batch/s, loss=1.4e+3] 


epoch 572: avg train loss 1396.69, bar train loss 2.332, len train loss 0.026, col train loss 124.586


Epoch 573: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 572: avg test  loss 1427.82, bar  test loss 2.682, len  test loss 0.030, col  test loss 127.731


Epoch 573: 272batch [00:25, 10.56batch/s, loss=1.43e+3]


epoch 573: avg train loss 1396.98, bar train loss 2.334, len train loss 0.026, col train loss 124.621


Epoch 574: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 573: avg test  loss 1429.86, bar  test loss 2.586, len  test loss 0.029, col  test loss 127.452


Epoch 574: 272batch [00:25, 10.54batch/s, loss=1.37e+3]


epoch 574: avg train loss 1397.04, bar train loss 2.361, len train loss 0.026, col train loss 124.565


Epoch 575: 0batch [00:00, ?batch/s]

epoch 574: avg test  loss 1427.84, bar  test loss 2.548, len  test loss 0.031, col  test loss 127.205


Epoch 575: 272batch [00:25, 10.54batch/s, loss=1.39e+3]


epoch 575: avg train loss 1397.40, bar train loss 2.334, len train loss 0.026, col train loss 124.623
epoch 575: avg test  loss 1429.77, bar  test loss 2.502, len  test loss 0.030, col  test loss 128.056


Epoch 576: 272batch [00:25, 10.54batch/s, loss=1.32e+3]


epoch 576: avg train loss 1397.44, bar train loss 2.344, len train loss 0.026, col train loss 124.671


Epoch 577: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 576: avg test  loss 1428.24, bar  test loss 2.533, len  test loss 0.031, col  test loss 127.405


Epoch 577: 272batch [00:25, 10.55batch/s, loss=1.38e+3]


epoch 577: avg train loss 1397.59, bar train loss 2.332, len train loss 0.026, col train loss 124.712


Epoch 578: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 577: avg test  loss 1430.97, bar  test loss 2.541, len  test loss 0.031, col  test loss 128.172


Epoch 578: 272batch [00:25, 10.52batch/s, loss=1.38e+3]


epoch 578: avg train loss 1397.47, bar train loss 2.345, len train loss 0.025, col train loss 124.652


Epoch 579: 1batch [00:00,  9.52batch/s, loss=1.37e+3]

epoch 578: avg test  loss 1432.98, bar  test loss 2.732, len  test loss 0.030, col  test loss 128.121


Epoch 579: 272batch [00:25, 10.55batch/s, loss=1.44e+3]


epoch 579: avg train loss 1398.85, bar train loss 2.356, len train loss 0.027, col train loss 124.815


Epoch 580: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 579: avg test  loss 1429.24, bar  test loss 2.554, len  test loss 0.029, col  test loss 128.224


Epoch 580: 272batch [00:25, 10.48batch/s, loss=1.33e+3]


epoch 580: avg train loss 1399.81, bar train loss 2.359, len train loss 0.026, col train loss 124.886
epoch 580: avg test  loss 1429.14, bar  test loss 2.559, len  test loss 0.031, col  test loss 127.592


Epoch 581: 272batch [00:26, 10.45batch/s, loss=1.38e+3]


epoch 581: avg train loss 1398.58, bar train loss 2.360, len train loss 0.026, col train loss 124.752


Epoch 582: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 581: avg test  loss 1429.76, bar  test loss 2.516, len  test loss 0.031, col  test loss 127.599


Epoch 582: 272batch [00:26, 10.43batch/s, loss=1.48e+3]


epoch 582: avg train loss 1399.36, bar train loss 2.340, len train loss 0.027, col train loss 124.869


Epoch 583: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 582: avg test  loss 1431.06, bar  test loss 2.515, len  test loss 0.033, col  test loss 128.402


Epoch 583: 272batch [00:26, 10.46batch/s, loss=1.39e+3]


epoch 583: avg train loss 1399.29, bar train loss 2.363, len train loss 0.026, col train loss 124.790


Epoch 584: 1batch [00:00,  9.26batch/s, loss=1.32e+3]

epoch 583: avg test  loss 1430.08, bar  test loss 2.554, len  test loss 0.030, col  test loss 127.880


Epoch 584: 272batch [00:26, 10.45batch/s, loss=1.42e+3]


epoch 584: avg train loss 1399.29, bar train loss 2.337, len train loss 0.026, col train loss 124.830


Epoch 585: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 584: avg test  loss 1430.11, bar  test loss 2.552, len  test loss 0.028, col  test loss 127.597


Epoch 585: 272batch [00:26, 10.41batch/s, loss=1.3e+3] 


epoch 585: avg train loss 1399.11, bar train loss 2.351, len train loss 0.026, col train loss 124.790
epoch 585: avg test  loss 1434.58, bar  test loss 3.051, len  test loss 0.030, col  test loss 127.770


Epoch 586: 272batch [00:26, 10.43batch/s, loss=1.36e+3]


epoch 586: avg train loss 1400.07, bar train loss 2.373, len train loss 0.026, col train loss 124.863


Epoch 587: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 586: avg test  loss 1430.70, bar  test loss 2.724, len  test loss 0.032, col  test loss 127.601


Epoch 587: 272batch [00:26, 10.40batch/s, loss=1.41e+3]


epoch 587: avg train loss 1399.67, bar train loss 2.370, len train loss 0.026, col train loss 124.823


Epoch 588: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 587: avg test  loss 1434.10, bar  test loss 2.708, len  test loss 0.031, col  test loss 127.937


Epoch 588: 272batch [00:26, 10.33batch/s, loss=1.47e+3]


epoch 588: avg train loss 1400.72, bar train loss 2.360, len train loss 0.026, col train loss 125.002


Epoch 589: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 588: avg test  loss 1430.99, bar  test loss 2.575, len  test loss 0.033, col  test loss 128.064


Epoch 589: 272batch [00:26, 10.42batch/s, loss=1.34e+3]


epoch 589: avg train loss 1400.05, bar train loss 2.367, len train loss 0.026, col train loss 124.829


Epoch 590: 0batch [00:00, ?batch/s, loss=1.34e+3]

epoch 589: avg test  loss 1430.22, bar  test loss 2.651, len  test loss 0.028, col  test loss 127.671


Epoch 590: 272batch [00:26, 10.41batch/s, loss=1.44e+3]


epoch 590: avg train loss 1401.40, bar train loss 2.368, len train loss 0.027, col train loss 124.976
epoch 590: avg test  loss 1430.41, bar  test loss 2.482, len  test loss 0.029, col  test loss 127.409


Epoch 591: 272batch [00:26, 10.30batch/s, loss=1.43e+3]


epoch 591: avg train loss 1401.13, bar train loss 2.367, len train loss 0.026, col train loss 124.951


Epoch 592: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 591: avg test  loss 1433.36, bar  test loss 2.599, len  test loss 0.029, col  test loss 128.228


Epoch 592: 272batch [00:26, 10.36batch/s, loss=1.39e+3]


epoch 592: avg train loss 1401.60, bar train loss 2.380, len train loss 0.026, col train loss 124.968


Epoch 593: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 592: avg test  loss 1430.88, bar  test loss 2.576, len  test loss 0.030, col  test loss 127.758


Epoch 593: 272batch [00:26, 10.37batch/s, loss=1.41e+3]


epoch 593: avg train loss 1401.42, bar train loss 2.369, len train loss 0.026, col train loss 124.985


Epoch 594: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 593: avg test  loss 1432.97, bar  test loss 2.567, len  test loss 0.030, col  test loss 127.813


Epoch 594: 272batch [00:26, 10.09batch/s, loss=1.43e+3]


epoch 594: avg train loss 1401.90, bar train loss 2.360, len train loss 0.026, col train loss 125.000


Epoch 595: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 594: avg test  loss 1430.82, bar  test loss 2.621, len  test loss 0.029, col  test loss 128.159


Epoch 595: 272batch [00:26, 10.24batch/s, loss=1.37e+3]


epoch 595: avg train loss 1402.42, bar train loss 2.382, len train loss 0.026, col train loss 125.112
epoch 595: avg test  loss 1432.99, bar  test loss 2.528, len  test loss 0.029, col  test loss 127.934


Epoch 596: 272batch [00:26, 10.36batch/s, loss=1.36e+3]


epoch 596: avg train loss 1403.31, bar train loss 2.389, len train loss 0.027, col train loss 125.225


Epoch 597: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 596: avg test  loss 1435.45, bar  test loss 2.618, len  test loss 0.029, col  test loss 128.316


Epoch 597: 272batch [00:26, 10.39batch/s, loss=1.44e+3]


epoch 597: avg train loss 1402.46, bar train loss 2.365, len train loss 0.027, col train loss 125.067


Epoch 598: 1batch [00:00,  9.80batch/s, loss=1.45e+3]

epoch 597: avg test  loss 1432.44, bar  test loss 2.673, len  test loss 0.030, col  test loss 127.985


Epoch 598: 272batch [00:26, 10.38batch/s, loss=1.39e+3]


epoch 598: avg train loss 1402.18, bar train loss 2.384, len train loss 0.026, col train loss 125.126


Epoch 599: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 598: avg test  loss 1432.89, bar  test loss 2.666, len  test loss 0.028, col  test loss 127.778


Epoch 599: 272batch [00:26, 10.37batch/s, loss=1.4e+3] 


epoch 599: avg train loss 1402.81, bar train loss 2.399, len train loss 0.026, col train loss 125.165


Epoch 600: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 599: avg test  loss 1437.06, bar  test loss 2.773, len  test loss 0.029, col  test loss 127.994


Epoch 600: 272batch [00:26, 10.39batch/s, loss=1.39e+3]


epoch 600: avg train loss 1403.53, bar train loss 2.395, len train loss 0.026, col train loss 125.195
epoch 600: avg test  loss 1432.24, bar  test loss 2.618, len  test loss 0.032, col  test loss 127.954


Epoch 601: 272batch [00:26, 10.17batch/s, loss=1.36e+3]


epoch 601: avg train loss 1403.64, bar train loss 2.369, len train loss 0.026, col train loss 125.232


Epoch 602: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 601: avg test  loss 1433.07, bar  test loss 2.525, len  test loss 0.032, col  test loss 127.578


Epoch 602: 272batch [00:26, 10.25batch/s, loss=1.41e+3]


epoch 602: avg train loss 1404.14, bar train loss 2.379, len train loss 0.027, col train loss 125.196


Epoch 603: 1batch [00:00,  9.52batch/s, loss=1.41e+3]

epoch 602: avg test  loss 1432.66, bar  test loss 2.575, len  test loss 0.030, col  test loss 127.830


Epoch 603: 272batch [00:26, 10.33batch/s, loss=1.34e+3]


epoch 603: avg train loss 1404.35, bar train loss 2.378, len train loss 0.026, col train loss 125.245


Epoch 604: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 603: avg test  loss 1431.76, bar  test loss 2.555, len  test loss 0.032, col  test loss 127.767


Epoch 604: 272batch [00:26, 10.34batch/s, loss=1.48e+3]


epoch 604: avg train loss 1403.80, bar train loss 2.374, len train loss 0.026, col train loss 125.253


Epoch 605: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 604: avg test  loss 1440.19, bar  test loss 2.755, len  test loss 0.032, col  test loss 128.353


Epoch 605: 272batch [00:26, 10.29batch/s, loss=1.3e+3] 


epoch 605: avg train loss 1405.32, bar train loss 2.388, len train loss 0.026, col train loss 125.348
epoch 605: avg test  loss 1433.98, bar  test loss 2.541, len  test loss 0.029, col  test loss 127.857


Epoch 606: 272batch [00:26, 10.26batch/s, loss=1.44e+3]


epoch 606: avg train loss 1404.13, bar train loss 2.388, len train loss 0.027, col train loss 125.269


Epoch 607: 1batch [00:00,  9.62batch/s, loss=1.37e+3]

epoch 606: avg test  loss 1433.47, bar  test loss 2.546, len  test loss 0.034, col  test loss 128.335


Epoch 607: 272batch [00:26, 10.24batch/s, loss=1.4e+3] 


epoch 607: avg train loss 1405.19, bar train loss 2.395, len train loss 0.027, col train loss 125.395


Epoch 608: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 607: avg test  loss 1434.72, bar  test loss 2.544, len  test loss 0.029, col  test loss 128.131


Epoch 608: 272batch [00:26, 10.12batch/s, loss=1.41e+3]


epoch 608: avg train loss 1405.27, bar train loss 2.391, len train loss 0.026, col train loss 125.447


Epoch 609: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 608: avg test  loss 1440.81, bar  test loss 2.915, len  test loss 0.032, col  test loss 128.615


Epoch 609: 272batch [00:26, 10.19batch/s, loss=1.43e+3]


epoch 609: avg train loss 1404.93, bar train loss 2.405, len train loss 0.026, col train loss 125.399


Epoch 610: 1batch [00:00, 10.00batch/s, loss=1.41e+3]

epoch 609: avg test  loss 1432.95, bar  test loss 2.663, len  test loss 0.031, col  test loss 128.037


Epoch 610: 272batch [00:26, 10.27batch/s, loss=1.38e+3]


epoch 610: avg train loss 1406.02, bar train loss 2.400, len train loss 0.026, col train loss 125.445
epoch 610: avg test  loss 1437.71, bar  test loss 2.519, len  test loss 0.031, col  test loss 127.792


Epoch 611: 272batch [00:27, 10.05batch/s, loss=1.48e+3]


epoch 611: avg train loss 1405.60, bar train loss 2.401, len train loss 0.027, col train loss 125.465


Epoch 612: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 611: avg test  loss 1437.01, bar  test loss 2.658, len  test loss 0.031, col  test loss 128.847


Epoch 612: 272batch [00:26, 10.29batch/s, loss=1.5e+3] 


epoch 612: avg train loss 1406.23, bar train loss 2.402, len train loss 0.027, col train loss 125.452


Epoch 613: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 612: avg test  loss 1436.27, bar  test loss 2.592, len  test loss 0.030, col  test loss 127.851


Epoch 613: 272batch [00:26, 10.24batch/s, loss=1.48e+3]


epoch 613: avg train loss 1405.66, bar train loss 2.404, len train loss 0.027, col train loss 125.418


Epoch 614: 1batch [00:00,  9.71batch/s, loss=1.41e+3]

epoch 613: avg test  loss 1443.20, bar  test loss 2.684, len  test loss 0.031, col  test loss 129.163


Epoch 614: 272batch [00:26, 10.15batch/s, loss=1.33e+3]


epoch 614: avg train loss 1407.21, bar train loss 2.414, len train loss 0.027, col train loss 125.606


Epoch 615: 1batch [00:00, 10.00batch/s, loss=1.45e+3]

epoch 614: avg test  loss 1437.20, bar  test loss 2.731, len  test loss 0.031, col  test loss 128.379


Epoch 615: 272batch [00:26, 10.21batch/s, loss=1.53e+3]


epoch 615: avg train loss 1407.44, bar train loss 2.418, len train loss 0.027, col train loss 125.610
epoch 615: avg test  loss 1434.57, bar  test loss 2.666, len  test loss 0.029, col  test loss 127.992


Epoch 616: 272batch [00:26, 10.09batch/s, loss=1.54e+3]


epoch 616: avg train loss 1407.05, bar train loss 2.423, len train loss 0.027, col train loss 125.587


Epoch 617: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 616: avg test  loss 1435.14, bar  test loss 2.586, len  test loss 0.030, col  test loss 128.604


Epoch 617: 272batch [00:26, 10.17batch/s, loss=1.46e+3]


epoch 617: avg train loss 1406.90, bar train loss 2.398, len train loss 0.026, col train loss 125.534


Epoch 618: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 617: avg test  loss 1439.85, bar  test loss 2.547, len  test loss 0.030, col  test loss 128.714


Epoch 618: 272batch [00:26, 10.24batch/s, loss=1.33e+3]


epoch 618: avg train loss 1408.79, bar train loss 2.410, len train loss 0.027, col train loss 125.792


Epoch 619: 0batch [00:00, ?batch/s, loss=1.37e+3]

epoch 618: avg test  loss 1439.85, bar  test loss 2.721, len  test loss 0.030, col  test loss 128.814


Epoch 619: 272batch [00:27,  9.92batch/s, loss=1.43e+3]


epoch 619: avg train loss 1408.82, bar train loss 2.433, len train loss 0.026, col train loss 125.790


Epoch 620: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 619: avg test  loss 1440.11, bar  test loss 2.574, len  test loss 0.030, col  test loss 128.490


Epoch 620: 272batch [00:27,  9.88batch/s, loss=1.48e+3]


epoch 620: avg train loss 1408.75, bar train loss 2.415, len train loss 0.027, col train loss 125.759
epoch 620: avg test  loss 1435.94, bar  test loss 2.647, len  test loss 0.035, col  test loss 128.218


Epoch 621: 272batch [00:27,  9.74batch/s, loss=1.24e+3]


epoch 621: avg train loss 1409.47, bar train loss 2.426, len train loss 0.027, col train loss 125.873


Epoch 622: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 621: avg test  loss 1438.91, bar  test loss 2.628, len  test loss 0.031, col  test loss 128.202


Epoch 622: 272batch [00:28,  9.56batch/s, loss=1.38e+3]


epoch 622: avg train loss 1410.00, bar train loss 2.430, len train loss 0.026, col train loss 125.838


Epoch 623: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 622: avg test  loss 1439.35, bar  test loss 2.759, len  test loss 0.030, col  test loss 128.858


Epoch 623: 272batch [00:28,  9.58batch/s, loss=1.5e+3] 


epoch 623: avg train loss 1409.22, bar train loss 2.429, len train loss 0.027, col train loss 125.831


Epoch 624: 1batch [00:00,  9.62batch/s, loss=1.42e+3]

epoch 623: avg test  loss 1436.17, bar  test loss 2.599, len  test loss 0.031, col  test loss 127.965


Epoch 624: 272batch [00:28,  9.70batch/s, loss=1.44e+3]


epoch 624: avg train loss 1409.61, bar train loss 2.414, len train loss 0.027, col train loss 125.806


Epoch 625: 1batch [00:00,  9.01batch/s, loss=1.38e+3]

epoch 624: avg test  loss 1442.81, bar  test loss 2.620, len  test loss 0.033, col  test loss 129.292


Epoch 625: 272batch [00:28,  9.52batch/s, loss=1.49e+3]


epoch 625: avg train loss 1409.78, bar train loss 2.438, len train loss 0.027, col train loss 125.865
epoch 625: avg test  loss 1438.78, bar  test loss 2.653, len  test loss 0.030, col  test loss 128.515


Epoch 626: 272batch [00:27,  9.92batch/s, loss=1.43e+3]


epoch 626: avg train loss 1411.56, bar train loss 2.440, len train loss 0.028, col train loss 125.949


Epoch 627: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 626: avg test  loss 1438.18, bar  test loss 2.583, len  test loss 0.029, col  test loss 128.422


Epoch 627: 272batch [00:27,  9.82batch/s, loss=1.37e+3]


epoch 627: avg train loss 1410.67, bar train loss 2.445, len train loss 0.027, col train loss 125.927


Epoch 628: 1batch [00:00,  9.90batch/s, loss=1.43e+3]

epoch 627: avg test  loss 1438.51, bar  test loss 2.788, len  test loss 0.030, col  test loss 128.069


Epoch 628: 272batch [00:26, 10.18batch/s, loss=1.47e+3]


epoch 628: avg train loss 1410.46, bar train loss 2.427, len train loss 0.027, col train loss 125.825


Epoch 629: 1batch [00:00,  9.01batch/s, loss=1.41e+3]

epoch 628: avg test  loss 1440.16, bar  test loss 2.737, len  test loss 0.030, col  test loss 128.892


Epoch 629: 272batch [00:27,  9.93batch/s, loss=1.43e+3]


epoch 629: avg train loss 1410.64, bar train loss 2.435, len train loss 0.027, col train loss 126.003


Epoch 630: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 629: avg test  loss 1440.34, bar  test loss 2.696, len  test loss 0.029, col  test loss 128.613


Epoch 630: 272batch [00:27,  9.92batch/s, loss=1.42e+3]


epoch 630: avg train loss 1410.37, bar train loss 2.449, len train loss 0.027, col train loss 125.836
epoch 630: avg test  loss 1438.24, bar  test loss 2.654, len  test loss 0.029, col  test loss 128.228


Epoch 631: 272batch [00:28,  9.68batch/s, loss=1.4e+3] 


epoch 631: avg train loss 1411.52, bar train loss 2.422, len train loss 0.026, col train loss 126.017


Epoch 632: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 631: avg test  loss 1436.54, bar  test loss 2.575, len  test loss 0.029, col  test loss 128.023


Epoch 632: 272batch [00:26, 10.16batch/s, loss=1.42e+3]


epoch 632: avg train loss 1411.98, bar train loss 2.471, len train loss 0.027, col train loss 126.083


Epoch 633: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 632: avg test  loss 1441.00, bar  test loss 2.584, len  test loss 0.029, col  test loss 128.578


Epoch 633: 272batch [00:27,  9.87batch/s, loss=1.44e+3]


epoch 633: avg train loss 1411.81, bar train loss 2.440, len train loss 0.027, col train loss 125.978


Epoch 634: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 633: avg test  loss 1440.48, bar  test loss 2.618, len  test loss 0.031, col  test loss 129.023


Epoch 634: 272batch [00:27, 10.07batch/s, loss=1.26e+3]


epoch 634: avg train loss 1412.29, bar train loss 2.451, len train loss 0.027, col train loss 126.152


Epoch 635: 1batch [00:00,  9.80batch/s, loss=1.36e+3]

epoch 634: avg test  loss 1440.02, bar  test loss 2.725, len  test loss 0.029, col  test loss 129.232


Epoch 635: 272batch [00:27,  9.86batch/s, loss=1.6e+3] 


epoch 635: avg train loss 1411.96, bar train loss 2.433, len train loss 0.027, col train loss 126.051
epoch 635: avg test  loss 1438.75, bar  test loss 2.563, len  test loss 0.030, col  test loss 128.433


Epoch 636: 272batch [00:28,  9.65batch/s, loss=1.39e+3]


epoch 636: avg train loss 1412.02, bar train loss 2.425, len train loss 0.027, col train loss 125.973


Epoch 637: 0batch [00:00, ?batch/s, loss=1.36e+3]

epoch 636: avg test  loss 1441.15, bar  test loss 2.531, len  test loss 0.031, col  test loss 128.530


Epoch 637: 272batch [00:27,  9.80batch/s, loss=1.32e+3]


epoch 637: avg train loss 1412.81, bar train loss 2.472, len train loss 0.027, col train loss 126.051


Epoch 638: 1batch [00:00,  9.62batch/s, loss=1.42e+3]

epoch 637: avg test  loss 1440.13, bar  test loss 2.806, len  test loss 0.029, col  test loss 128.332


Epoch 638: 272batch [00:27,  9.91batch/s, loss=1.38e+3]


epoch 638: avg train loss 1412.24, bar train loss 2.465, len train loss 0.028, col train loss 126.106


Epoch 639: 0batch [00:00, ?batch/s, loss=1.35e+3]

epoch 638: avg test  loss 1440.32, bar  test loss 2.528, len  test loss 0.030, col  test loss 128.589


Epoch 639: 272batch [00:28,  9.64batch/s, loss=1.33e+3]


epoch 639: avg train loss 1413.42, bar train loss 2.437, len train loss 0.027, col train loss 126.116


Epoch 640: 1batch [00:00,  9.90batch/s, loss=1.38e+3]

epoch 639: avg test  loss 1439.55, bar  test loss 2.575, len  test loss 0.029, col  test loss 128.202


Epoch 640: 272batch [00:28,  9.62batch/s, loss=1.38e+3]


epoch 640: avg train loss 1413.28, bar train loss 2.454, len train loss 0.027, col train loss 126.149
epoch 640: avg test  loss 1442.70, bar  test loss 2.796, len  test loss 0.031, col  test loss 128.578


Epoch 641: 272batch [00:28,  9.45batch/s, loss=1.48e+3]


epoch 641: avg train loss 1415.04, bar train loss 2.498, len train loss 0.027, col train loss 126.407


Epoch 642: 1batch [00:00,  9.71batch/s, loss=1.34e+3]

epoch 641: avg test  loss 1445.65, bar  test loss 2.754, len  test loss 0.029, col  test loss 129.376


Epoch 642: 272batch [00:28,  9.50batch/s, loss=1.44e+3]


epoch 642: avg train loss 1413.76, bar train loss 2.452, len train loss 0.027, col train loss 126.267


Epoch 643: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 642: avg test  loss 1440.87, bar  test loss 2.722, len  test loss 0.030, col  test loss 128.753


Epoch 643: 272batch [00:28,  9.62batch/s, loss=1.43e+3]


epoch 643: avg train loss 1414.09, bar train loss 2.471, len train loss 0.027, col train loss 126.266


Epoch 644: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 643: avg test  loss 1442.92, bar  test loss 2.645, len  test loss 0.029, col  test loss 128.963


Epoch 644: 272batch [00:28,  9.44batch/s, loss=1.3e+3] 


epoch 644: avg train loss 1415.37, bar train loss 2.462, len train loss 0.027, col train loss 126.354


Epoch 645: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 644: avg test  loss 1442.99, bar  test loss 2.697, len  test loss 0.032, col  test loss 129.293


Epoch 645: 272batch [00:28,  9.52batch/s, loss=1.35e+3]


epoch 645: avg train loss 1417.02, bar train loss 2.490, len train loss 0.028, col train loss 126.578
epoch 645: avg test  loss 1449.68, bar  test loss 2.645, len  test loss 0.036, col  test loss 129.689


Epoch 646: 272batch [00:28,  9.42batch/s, loss=1.63e+3]


epoch 646: avg train loss 1415.89, bar train loss 2.470, len train loss 0.028, col train loss 126.359


Epoch 647: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 646: avg test  loss 1444.99, bar  test loss 2.583, len  test loss 0.031, col  test loss 129.336


Epoch 647: 272batch [00:28,  9.49batch/s, loss=1.42e+3]


epoch 647: avg train loss 1415.92, bar train loss 2.470, len train loss 0.027, col train loss 126.458


Epoch 648: 1batch [00:00,  9.62batch/s, loss=1.42e+3]

epoch 647: avg test  loss 1441.34, bar  test loss 2.628, len  test loss 0.031, col  test loss 128.853


Epoch 648: 272batch [00:28,  9.47batch/s, loss=1.52e+3]


epoch 648: avg train loss 1416.30, bar train loss 2.470, len train loss 0.027, col train loss 126.473


Epoch 649: 1batch [00:00,  9.26batch/s, loss=1.4e+3]

epoch 648: avg test  loss 1443.39, bar  test loss 2.761, len  test loss 0.029, col  test loss 128.869


Epoch 649: 272batch [00:29,  9.23batch/s, loss=1.43e+3]


epoch 649: avg train loss 1416.77, bar train loss 2.505, len train loss 0.027, col train loss 126.501


Epoch 650: 1batch [00:00,  9.80batch/s, loss=1.48e+3]

epoch 649: avg test  loss 1448.56, bar  test loss 2.772, len  test loss 0.031, col  test loss 129.635


Epoch 650: 272batch [00:28,  9.45batch/s, loss=1.3e+3] 


epoch 650: avg train loss 1416.80, bar train loss 2.478, len train loss 0.027, col train loss 126.522
epoch 650: avg test  loss 1447.31, bar  test loss 2.794, len  test loss 0.032, col  test loss 129.332


Epoch 651: 272batch [00:28,  9.41batch/s, loss=1.45e+3]


epoch 651: avg train loss 1417.89, bar train loss 2.496, len train loss 0.028, col train loss 126.600


Epoch 652: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 651: avg test  loss 1445.52, bar  test loss 2.797, len  test loss 0.029, col  test loss 128.902


Epoch 652: 272batch [00:28,  9.46batch/s, loss=1.56e+3]


epoch 652: avg train loss 1417.91, bar train loss 2.487, len train loss 0.027, col train loss 126.595


Epoch 653: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 652: avg test  loss 1447.55, bar  test loss 2.866, len  test loss 0.029, col  test loss 129.238


Epoch 653: 272batch [00:29,  9.37batch/s, loss=1.34e+3]


epoch 653: avg train loss 1418.38, bar train loss 2.502, len train loss 0.028, col train loss 126.686


Epoch 654: 1batch [00:00,  9.90batch/s, loss=1.4e+3]

epoch 653: avg test  loss 1445.38, bar  test loss 2.598, len  test loss 0.031, col  test loss 128.926


Epoch 654: 272batch [00:28,  9.47batch/s, loss=1.35e+3]


epoch 654: avg train loss 1416.66, bar train loss 2.466, len train loss 0.028, col train loss 126.487


Epoch 655: 0batch [00:00, ?batch/s, loss=1.38e+3]

epoch 654: avg test  loss 1443.98, bar  test loss 2.675, len  test loss 0.034, col  test loss 129.405


Epoch 655: 272batch [00:28,  9.41batch/s, loss=1.59e+3]


epoch 655: avg train loss 1418.19, bar train loss 2.508, len train loss 0.028, col train loss 126.691
epoch 655: avg test  loss 1450.51, bar  test loss 3.028, len  test loss 0.032, col  test loss 129.750


Epoch 656: 272batch [00:28,  9.38batch/s, loss=1.49e+3]


epoch 656: avg train loss 1418.30, bar train loss 2.530, len train loss 0.028, col train loss 126.674


Epoch 657: 1batch [00:00,  9.71batch/s, loss=1.44e+3]

epoch 656: avg test  loss 1445.01, bar  test loss 2.791, len  test loss 0.032, col  test loss 129.570


Epoch 657: 272batch [00:29,  9.31batch/s, loss=1.46e+3]


epoch 657: avg train loss 1419.29, bar train loss 2.501, len train loss 0.028, col train loss 126.682


Epoch 658: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 657: avg test  loss 1451.63, bar  test loss 2.844, len  test loss 0.033, col  test loss 128.998


Epoch 658: 272batch [00:29,  9.36batch/s, loss=1.3e+3] 


epoch 658: avg train loss 1419.70, bar train loss 2.516, len train loss 0.028, col train loss 126.776


Epoch 659: 1batch [00:00,  9.90batch/s, loss=1.4e+3]

epoch 658: avg test  loss 1452.39, bar  test loss 2.680, len  test loss 0.031, col  test loss 129.773


Epoch 659: 272batch [00:29,  9.31batch/s, loss=1.26e+3]


epoch 659: avg train loss 1420.04, bar train loss 2.516, len train loss 0.028, col train loss 126.696


Epoch 660: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 659: avg test  loss 1446.29, bar  test loss 2.578, len  test loss 0.030, col  test loss 128.977


Epoch 660: 272batch [00:29,  9.31batch/s, loss=1.54e+3]


epoch 660: avg train loss 1420.10, bar train loss 2.518, len train loss 0.028, col train loss 126.874
epoch 660: avg test  loss 1448.55, bar  test loss 2.846, len  test loss 0.030, col  test loss 129.297


Epoch 661: 272batch [00:29,  9.30batch/s, loss=1.33e+3]


epoch 661: avg train loss 1419.92, bar train loss 2.534, len train loss 0.028, col train loss 126.766


Epoch 662: 1batch [00:00,  9.71batch/s, loss=1.42e+3]

epoch 661: avg test  loss 1447.88, bar  test loss 2.763, len  test loss 0.031, col  test loss 129.717


Epoch 662: 272batch [00:29,  9.33batch/s, loss=1.46e+3]


epoch 662: avg train loss 1419.33, bar train loss 2.493, len train loss 0.027, col train loss 126.758


Epoch 663: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 662: avg test  loss 1448.18, bar  test loss 2.903, len  test loss 0.031, col  test loss 129.522


Epoch 663: 272batch [00:29,  9.36batch/s, loss=1.38e+3]


epoch 663: avg train loss 1419.59, bar train loss 2.509, len train loss 0.028, col train loss 126.691


Epoch 664: 1batch [00:00,  9.43batch/s, loss=1.39e+3]

epoch 663: avg test  loss 1446.51, bar  test loss 2.795, len  test loss 0.032, col  test loss 128.924


Epoch 664: 272batch [00:29,  9.29batch/s, loss=1.46e+3]


epoch 664: avg train loss 1421.12, bar train loss 2.503, len train loss 0.028, col train loss 126.900


Epoch 665: 1batch [00:00, 10.00batch/s, loss=1.43e+3]

epoch 664: avg test  loss 1450.70, bar  test loss 2.830, len  test loss 0.031, col  test loss 129.523


Epoch 665: 272batch [00:29,  9.30batch/s, loss=1.34e+3]


epoch 665: avg train loss 1420.33, bar train loss 2.532, len train loss 0.027, col train loss 126.778
epoch 665: avg test  loss 1447.34, bar  test loss 2.963, len  test loss 0.031, col  test loss 129.324


Epoch 666: 272batch [00:29,  9.30batch/s, loss=1.47e+3]


epoch 666: avg train loss 1421.60, bar train loss 2.555, len train loss 0.028, col train loss 127.083


Epoch 667: 1batch [00:00,  9.90batch/s, loss=1.46e+3]

epoch 666: avg test  loss 1452.46, bar  test loss 2.726, len  test loss 0.033, col  test loss 129.898


Epoch 667: 272batch [00:29,  9.32batch/s, loss=1.37e+3]


epoch 667: avg train loss 1421.64, bar train loss 2.516, len train loss 0.028, col train loss 126.905


Epoch 668: 1batch [00:00,  9.62batch/s, loss=1.46e+3]

epoch 667: avg test  loss 1451.20, bar  test loss 2.734, len  test loss 0.031, col  test loss 129.536


Epoch 668: 272batch [00:29,  9.33batch/s, loss=1.4e+3] 


epoch 668: avg train loss 1422.16, bar train loss 2.517, len train loss 0.027, col train loss 127.087


Epoch 669: 1batch [00:00,  9.80batch/s, loss=1.42e+3]

epoch 668: avg test  loss 1452.23, bar  test loss 2.772, len  test loss 0.034, col  test loss 129.012


Epoch 669: 272batch [00:29,  9.29batch/s, loss=1.39e+3]


epoch 669: avg train loss 1424.37, bar train loss 2.530, len train loss 0.029, col train loss 127.214


Epoch 670: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 669: avg test  loss 1450.53, bar  test loss 2.678, len  test loss 0.033, col  test loss 129.905


Epoch 670: 272batch [00:29,  9.27batch/s, loss=1.5e+3] 


epoch 670: avg train loss 1422.71, bar train loss 2.551, len train loss 0.028, col train loss 127.067
epoch 670: avg test  loss 1450.40, bar  test loss 2.738, len  test loss 0.031, col  test loss 129.828


Epoch 671: 272batch [00:29,  9.28batch/s, loss=1.47e+3]


epoch 671: avg train loss 1423.15, bar train loss 2.592, len train loss 0.028, col train loss 127.178


Epoch 672: 0batch [00:00, ?batch/s]

epoch 671: avg test  loss 1448.72, bar  test loss 2.831, len  test loss 0.032, col  test loss 129.647


Epoch 672: 272batch [00:29,  9.14batch/s, loss=1.27e+3]


epoch 672: avg train loss 1423.27, bar train loss 2.527, len train loss 0.028, col train loss 127.170


Epoch 673: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 672: avg test  loss 1447.72, bar  test loss 2.691, len  test loss 0.030, col  test loss 129.284


Epoch 673: 272batch [00:29,  9.21batch/s, loss=1.38e+3]


epoch 673: avg train loss 1422.74, bar train loss 2.511, len train loss 0.028, col train loss 127.101


Epoch 674: 1batch [00:00,  9.90batch/s, loss=1.41e+3]

epoch 673: avg test  loss 1454.21, bar  test loss 2.962, len  test loss 0.033, col  test loss 129.810


Epoch 674: 272batch [00:29,  9.20batch/s, loss=1.57e+3]


epoch 674: avg train loss 1423.89, bar train loss 2.533, len train loss 0.028, col train loss 127.099


Epoch 675: 1batch [00:00,  9.90batch/s, loss=1.41e+3]

epoch 674: avg test  loss 1448.61, bar  test loss 2.659, len  test loss 0.031, col  test loss 129.333


Epoch 675: 272batch [00:29,  9.16batch/s, loss=1.37e+3]


epoch 675: avg train loss 1423.89, bar train loss 2.511, len train loss 0.028, col train loss 127.220
epoch 675: avg test  loss 1451.46, bar  test loss 2.784, len  test loss 0.032, col  test loss 129.963


Epoch 676: 272batch [00:29,  9.33batch/s, loss=1.45e+3]


epoch 676: avg train loss 1424.79, bar train loss 2.545, len train loss 0.028, col train loss 127.185


Epoch 677: 1batch [00:00,  8.93batch/s, loss=1.45e+3]

epoch 676: avg test  loss 1452.79, bar  test loss 2.690, len  test loss 0.032, col  test loss 129.355


Epoch 677: 272batch [00:29,  9.22batch/s, loss=1.42e+3]


epoch 677: avg train loss 1423.87, bar train loss 2.553, len train loss 0.029, col train loss 127.304


Epoch 678: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 677: avg test  loss 1452.76, bar  test loss 2.641, len  test loss 0.037, col  test loss 129.830


Epoch 678: 272batch [00:29,  9.28batch/s, loss=1.47e+3]


epoch 678: avg train loss 1425.70, bar train loss 2.556, len train loss 0.029, col train loss 127.354


Epoch 679: 1batch [00:00,  9.62batch/s, loss=1.48e+3]

epoch 678: avg test  loss 1451.38, bar  test loss 2.673, len  test loss 0.033, col  test loss 129.702


Epoch 679: 272batch [00:29,  9.13batch/s, loss=1.37e+3]


epoch 679: avg train loss 1424.32, bar train loss 2.548, len train loss 0.028, col train loss 127.262


Epoch 680: 1batch [00:00,  9.62batch/s, loss=1.38e+3]

epoch 679: avg test  loss 1452.68, bar  test loss 2.735, len  test loss 0.032, col  test loss 130.031


Epoch 680: 272batch [00:29,  9.23batch/s, loss=1.35e+3]


epoch 680: avg train loss 1426.02, bar train loss 2.558, len train loss 0.028, col train loss 127.474
epoch 680: avg test  loss 1454.27, bar  test loss 2.857, len  test loss 0.034, col  test loss 129.757


Epoch 681: 272batch [00:29,  9.27batch/s, loss=1.36e+3]


epoch 681: avg train loss 1426.62, bar train loss 2.567, len train loss 0.028, col train loss 127.519


Epoch 682: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 681: avg test  loss 1450.56, bar  test loss 2.713, len  test loss 0.034, col  test loss 130.504


Epoch 682: 272batch [00:29,  9.16batch/s, loss=1.39e+3]


epoch 682: avg train loss 1426.89, bar train loss 2.539, len train loss 0.028, col train loss 127.412


Epoch 683: 1batch [00:00,  9.90batch/s, loss=1.43e+3]

epoch 682: avg test  loss 1454.39, bar  test loss 2.688, len  test loss 0.031, col  test loss 129.668


Epoch 683: 272batch [00:29,  9.26batch/s, loss=1.56e+3]


epoch 683: avg train loss 1427.53, bar train loss 2.585, len train loss 0.028, col train loss 127.554


Epoch 684: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 683: avg test  loss 1454.88, bar  test loss 2.880, len  test loss 0.036, col  test loss 130.355


Epoch 684: 272batch [00:29,  9.17batch/s, loss=1.5e+3] 


epoch 684: avg train loss 1427.43, bar train loss 2.571, len train loss 0.029, col train loss 127.571


Epoch 685: 1batch [00:00,  9.62batch/s, loss=1.38e+3]

epoch 684: avg test  loss 1455.97, bar  test loss 2.926, len  test loss 0.035, col  test loss 130.493


Epoch 685: 272batch [00:29,  9.20batch/s, loss=1.39e+3]


epoch 685: avg train loss 1427.96, bar train loss 2.559, len train loss 0.028, col train loss 127.706
epoch 685: avg test  loss 1465.99, bar  test loss 3.562, len  test loss 0.033, col  test loss 130.384


Epoch 686: 272batch [00:29,  9.23batch/s, loss=1.38e+3]


epoch 686: avg train loss 1427.15, bar train loss 2.553, len train loss 0.028, col train loss 127.474


Epoch 687: 0batch [00:00, ?batch/s]

epoch 686: avg test  loss 1456.84, bar  test loss 2.943, len  test loss 0.033, col  test loss 130.018


Epoch 687: 272batch [00:30,  8.98batch/s, loss=1.49e+3]


epoch 687: avg train loss 1427.70, bar train loss 2.563, len train loss 0.028, col train loss 127.596


Epoch 688: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 687: avg test  loss 1449.53, bar  test loss 2.719, len  test loss 0.031, col  test loss 129.654


Epoch 688: 272batch [00:29,  9.24batch/s, loss=1.34e+3]


epoch 688: avg train loss 1428.38, bar train loss 2.548, len train loss 0.029, col train loss 127.677


Epoch 689: 1batch [00:00,  9.26batch/s, loss=1.35e+3]

epoch 688: avg test  loss 1469.80, bar  test loss 3.007, len  test loss 0.055, col  test loss 132.886


Epoch 689: 272batch [00:30,  8.96batch/s, loss=1.42e+3]


epoch 689: avg train loss 1427.80, bar train loss 2.536, len train loss 0.028, col train loss 127.467


Epoch 690: 1batch [00:00,  9.71batch/s, loss=1.37e+3]

epoch 689: avg test  loss 1455.89, bar  test loss 2.736, len  test loss 0.033, col  test loss 130.477


Epoch 690: 272batch [00:29,  9.21batch/s, loss=1.49e+3]


epoch 690: avg train loss 1428.74, bar train loss 2.561, len train loss 0.028, col train loss 127.538
epoch 690: avg test  loss 1452.28, bar  test loss 2.693, len  test loss 0.033, col  test loss 129.634


Epoch 691: 272batch [00:29,  9.15batch/s, loss=1.33e+3]


epoch 691: avg train loss 1428.62, bar train loss 2.580, len train loss 0.030, col train loss 127.696


Epoch 692: 1batch [00:00,  9.62batch/s, loss=1.39e+3]

epoch 691: avg test  loss 1454.68, bar  test loss 2.832, len  test loss 0.033, col  test loss 130.207


Epoch 692: 272batch [00:29,  9.22batch/s, loss=1.49e+3]


epoch 692: avg train loss 1428.21, bar train loss 2.574, len train loss 0.028, col train loss 127.548


Epoch 693: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 692: avg test  loss 1456.37, bar  test loss 3.114, len  test loss 0.032, col  test loss 130.081


Epoch 693: 272batch [00:29,  9.20batch/s, loss=1.44e+3]


epoch 693: avg train loss 1428.51, bar train loss 2.557, len train loss 0.029, col train loss 127.641


Epoch 694: 1batch [00:00,  9.52batch/s, loss=1.44e+3]

epoch 693: avg test  loss 1459.09, bar  test loss 3.260, len  test loss 0.032, col  test loss 129.946


Epoch 694: 272batch [00:29,  9.18batch/s, loss=1.34e+3]


epoch 694: avg train loss 1429.08, bar train loss 2.584, len train loss 0.029, col train loss 127.828


Epoch 695: 1batch [00:00,  9.71batch/s, loss=1.4e+3]

epoch 694: avg test  loss 1455.52, bar  test loss 2.805, len  test loss 0.033, col  test loss 129.713


Epoch 695: 272batch [00:29,  9.19batch/s, loss=1.47e+3]


epoch 695: avg train loss 1429.49, bar train loss 2.586, len train loss 0.029, col train loss 127.767
epoch 695: avg test  loss 1457.59, bar  test loss 2.825, len  test loss 0.035, col  test loss 130.319


Epoch 696: 272batch [00:29,  9.21batch/s, loss=1.44e+3]


epoch 696: avg train loss 1431.01, bar train loss 2.607, len train loss 0.029, col train loss 127.973


Epoch 697: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 696: avg test  loss 1460.86, bar  test loss 2.869, len  test loss 0.031, col  test loss 130.558


Epoch 697: 272batch [00:29,  9.18batch/s, loss=1.37e+3]


epoch 697: avg train loss 1430.37, bar train loss 2.572, len train loss 0.028, col train loss 127.862


Epoch 698: 1batch [00:00,  9.80batch/s, loss=1.48e+3]

epoch 697: avg test  loss 1459.46, bar  test loss 2.830, len  test loss 0.031, col  test loss 130.269


Epoch 698: 272batch [00:29,  9.19batch/s, loss=1.56e+3]


epoch 698: avg train loss 1431.65, bar train loss 2.587, len train loss 0.029, col train loss 127.996


Epoch 699: 1batch [00:00,  9.62batch/s, loss=1.46e+3]

epoch 698: avg test  loss 1460.85, bar  test loss 3.198, len  test loss 0.032, col  test loss 130.453


Epoch 699: 272batch [00:29,  9.12batch/s, loss=1.5e+3] 


epoch 699: avg train loss 1430.46, bar train loss 2.549, len train loss 0.029, col train loss 127.793


Epoch 700: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 699: avg test  loss 1456.83, bar  test loss 2.761, len  test loss 0.032, col  test loss 130.274


Epoch 700: 272batch [00:29,  9.17batch/s, loss=1.64e+3]


epoch 700: avg train loss 1430.81, bar train loss 2.575, len train loss 0.028, col train loss 127.796
epoch 700: avg test  loss 1462.14, bar  test loss 2.773, len  test loss 0.031, col  test loss 131.207


Epoch 701: 272batch [00:30,  8.94batch/s, loss=1.37e+3]


epoch 701: avg train loss 1433.04, bar train loss 2.626, len train loss 0.029, col train loss 128.099


Epoch 702: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 701: avg test  loss 1472.40, bar  test loss 4.205, len  test loss 0.034, col  test loss 131.078


Epoch 702: 272batch [00:29,  9.15batch/s, loss=1.32e+3]


epoch 702: avg train loss 1432.70, bar train loss 2.639, len train loss 0.029, col train loss 128.051


Epoch 703: 1batch [00:00,  9.90batch/s, loss=1.44e+3]

epoch 702: avg test  loss 1458.54, bar  test loss 2.881, len  test loss 0.032, col  test loss 130.560


Epoch 703: 272batch [00:29,  9.17batch/s, loss=1.38e+3]


epoch 703: avg train loss 1431.77, bar train loss 2.616, len train loss 0.029, col train loss 127.984


Epoch 704: 1batch [00:00,  6.67batch/s, loss=1.4e+3]

epoch 703: avg test  loss 1460.65, bar  test loss 2.786, len  test loss 0.030, col  test loss 130.812


Epoch 704: 272batch [00:29,  9.13batch/s, loss=1.51e+3]


epoch 704: avg train loss 1431.91, bar train loss 2.584, len train loss 0.028, col train loss 127.943


Epoch 705: 0batch [00:00, ?batch/s, loss=1.39e+3]

epoch 704: avg test  loss 1461.71, bar  test loss 2.784, len  test loss 0.033, col  test loss 130.194


Epoch 705: 272batch [00:29,  9.07batch/s, loss=1.4e+3] 


epoch 705: avg train loss 1432.73, bar train loss 2.576, len train loss 0.028, col train loss 128.092
epoch 705: avg test  loss 1461.10, bar  test loss 3.093, len  test loss 0.030, col  test loss 130.502


Epoch 706: 272batch [00:30,  9.05batch/s, loss=1.32e+3]


epoch 706: avg train loss 1432.73, bar train loss 2.636, len train loss 0.028, col train loss 128.085


Epoch 707: 0batch [00:00, ?batch/s, loss=1.4e+3]

epoch 706: avg test  loss 1460.28, bar  test loss 2.701, len  test loss 0.032, col  test loss 130.640


Epoch 707: 272batch [00:29,  9.08batch/s, loss=1.46e+3]


epoch 707: avg train loss 1433.91, bar train loss 2.623, len train loss 0.029, col train loss 128.171


Epoch 708: 0batch [00:00, ?batch/s]

epoch 707: avg test  loss 1464.54, bar  test loss 3.093, len  test loss 0.031, col  test loss 130.851


Epoch 708: 272batch [00:30,  8.92batch/s, loss=1.33e+3]


epoch 708: avg train loss 1433.68, bar train loss 2.637, len train loss 0.030, col train loss 128.199


Epoch 709: 1batch [00:00,  9.35batch/s, loss=1.44e+3]

epoch 708: avg test  loss 1462.16, bar  test loss 2.779, len  test loss 0.051, col  test loss 130.011


Epoch 709: 272batch [00:29,  9.11batch/s, loss=1.55e+3]


epoch 709: avg train loss 1433.30, bar train loss 2.573, len train loss 0.029, col train loss 128.060


Epoch 710: 0batch [00:00, ?batch/s, loss=1.42e+3]

epoch 709: avg test  loss 1463.02, bar  test loss 3.180, len  test loss 0.032, col  test loss 130.477


Epoch 710: 272batch [00:29,  9.12batch/s, loss=1.52e+3]


epoch 710: avg train loss 1435.07, bar train loss 2.653, len train loss 0.029, col train loss 128.412
epoch 710: avg test  loss 1463.54, bar  test loss 2.945, len  test loss 0.033, col  test loss 130.891


Epoch 711: 272batch [00:29,  9.10batch/s, loss=1.39e+3]


epoch 711: avg train loss 1435.64, bar train loss 2.596, len train loss 0.029, col train loss 128.489


Epoch 712: 1batch [00:00,  9.35batch/s, loss=1.35e+3]

epoch 711: avg test  loss 1459.26, bar  test loss 2.795, len  test loss 0.031, col  test loss 131.294


Epoch 712: 272batch [00:29,  9.13batch/s, loss=1.49e+3]


epoch 712: avg train loss 1435.42, bar train loss 2.600, len train loss 0.029, col train loss 128.374


Epoch 713: 1batch [00:00,  9.01batch/s, loss=1.42e+3]

epoch 712: avg test  loss 1463.16, bar  test loss 3.151, len  test loss 0.031, col  test loss 130.747


Epoch 713: 272batch [00:29,  9.09batch/s, loss=1.39e+3]


epoch 713: avg train loss 1435.60, bar train loss 2.632, len train loss 0.029, col train loss 128.381


Epoch 714: 1batch [00:00,  9.62batch/s, loss=1.48e+3]

epoch 713: avg test  loss 1461.35, bar  test loss 3.150, len  test loss 0.036, col  test loss 130.569


Epoch 714: 272batch [00:29,  9.10batch/s, loss=1.4e+3] 


epoch 714: avg train loss 1434.81, bar train loss 2.672, len train loss 0.029, col train loss 128.376


Epoch 715: 1batch [00:00,  9.01batch/s, loss=1.46e+3]

epoch 714: avg test  loss 1461.42, bar  test loss 3.057, len  test loss 0.032, col  test loss 130.720


Epoch 715: 272batch [00:29,  9.07batch/s, loss=1.45e+3]


epoch 715: avg train loss 1435.38, bar train loss 2.616, len train loss 0.029, col train loss 128.444
epoch 715: avg test  loss 1463.33, bar  test loss 2.804, len  test loss 0.033, col  test loss 131.266


Epoch 716: 272batch [00:30,  9.05batch/s, loss=1.52e+3]


epoch 716: avg train loss 1438.64, bar train loss 2.665, len train loss 0.030, col train loss 128.577


Epoch 717: 1batch [00:00,  9.90batch/s, loss=1.47e+3]

epoch 716: avg test  loss 1463.63, bar  test loss 2.932, len  test loss 0.031, col  test loss 131.329


Epoch 717: 272batch [00:29,  9.07batch/s, loss=1.63e+3]


epoch 717: avg train loss 1436.09, bar train loss 2.602, len train loss 0.028, col train loss 128.492


Epoch 718: 1batch [00:00,  9.35batch/s, loss=1.39e+3]

epoch 717: avg test  loss 1463.47, bar  test loss 2.905, len  test loss 0.033, col  test loss 130.865


Epoch 718: 272batch [00:29,  9.07batch/s, loss=1.43e+3]


epoch 718: avg train loss 1437.33, bar train loss 2.629, len train loss 0.029, col train loss 128.502


Epoch 719: 1batch [00:00,  9.43batch/s, loss=1.46e+3]

epoch 718: avg test  loss 1466.91, bar  test loss 3.108, len  test loss 0.033, col  test loss 130.595


Epoch 719: 272batch [00:29,  9.09batch/s, loss=1.4e+3] 


epoch 719: avg train loss 1436.74, bar train loss 2.659, len train loss 0.028, col train loss 128.366


Epoch 720: 1batch [00:00,  9.09batch/s, loss=1.43e+3]

epoch 719: avg test  loss 1462.05, bar  test loss 2.852, len  test loss 0.031, col  test loss 130.578


Epoch 720: 272batch [00:30,  9.00batch/s, loss=1.47e+3]


epoch 720: avg train loss 1436.46, bar train loss 2.643, len train loss 0.029, col train loss 128.466
epoch 720: avg test  loss 1456.40, bar  test loss 2.707, len  test loss 0.032, col  test loss 130.377


Epoch 721: 272batch [00:30,  9.04batch/s, loss=1.5e+3] 


epoch 721: avg train loss 1436.72, bar train loss 2.631, len train loss 0.029, col train loss 128.549


Epoch 722: 1batch [00:00,  9.26batch/s, loss=1.39e+3]

epoch 721: avg test  loss 1461.75, bar  test loss 2.705, len  test loss 0.032, col  test loss 130.705


Epoch 722: 272batch [00:30,  9.03batch/s, loss=1.47e+3]


epoch 722: avg train loss 1438.80, bar train loss 2.635, len train loss 0.030, col train loss 128.514


Epoch 723: 1batch [00:00,  9.90batch/s, loss=1.41e+3]

epoch 722: avg test  loss 1463.88, bar  test loss 2.958, len  test loss 0.033, col  test loss 130.826


Epoch 723: 272batch [00:30,  9.06batch/s, loss=1.37e+3]


epoch 723: avg train loss 1438.65, bar train loss 2.640, len train loss 0.029, col train loss 128.681


Epoch 724: 1batch [00:00,  9.62batch/s, loss=1.44e+3]

epoch 723: avg test  loss 1461.42, bar  test loss 2.854, len  test loss 0.034, col  test loss 131.156


Epoch 724: 272batch [00:30,  9.05batch/s, loss=1.42e+3]


epoch 724: avg train loss 1437.88, bar train loss 2.651, len train loss 0.029, col train loss 128.690


Epoch 725: 1batch [00:00,  9.35batch/s, loss=1.4e+3]

epoch 724: avg test  loss 1463.90, bar  test loss 2.762, len  test loss 0.036, col  test loss 131.411


Epoch 725: 272batch [00:30,  8.98batch/s, loss=1.5e+3] 


epoch 725: avg train loss 1440.56, bar train loss 2.670, len train loss 0.029, col train loss 128.880
epoch 725: avg test  loss 1466.62, bar  test loss 2.993, len  test loss 0.032, col  test loss 131.053


Epoch 726: 272batch [00:30,  8.96batch/s, loss=1.53e+3]


epoch 726: avg train loss 1439.52, bar train loss 2.636, len train loss 0.029, col train loss 128.815


Epoch 727: 1batch [00:00,  8.40batch/s, loss=1.38e+3]

epoch 726: avg test  loss 1467.06, bar  test loss 3.034, len  test loss 0.032, col  test loss 130.433


Epoch 727: 272batch [00:30,  8.85batch/s, loss=1.5e+3] 


epoch 727: avg train loss 1439.67, bar train loss 2.672, len train loss 0.029, col train loss 128.783


Epoch 728: 1batch [00:00,  9.26batch/s, loss=1.51e+3]

epoch 727: avg test  loss 1466.75, bar  test loss 2.880, len  test loss 0.034, col  test loss 132.192


Epoch 728: 272batch [00:30,  9.04batch/s, loss=1.37e+3]


epoch 728: avg train loss 1440.06, bar train loss 2.668, len train loss 0.029, col train loss 128.877


Epoch 729: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 728: avg test  loss 1466.33, bar  test loss 3.165, len  test loss 0.030, col  test loss 130.465


Epoch 729: 272batch [00:30,  9.05batch/s, loss=1.49e+3]


epoch 729: avg train loss 1440.92, bar train loss 2.663, len train loss 0.029, col train loss 128.751


Epoch 730: 1batch [00:00,  9.80batch/s, loss=1.44e+3]

epoch 729: avg test  loss 1469.53, bar  test loss 3.205, len  test loss 0.032, col  test loss 131.304


Epoch 730: 272batch [00:30,  8.98batch/s, loss=1.42e+3]


epoch 730: avg train loss 1441.20, bar train loss 2.632, len train loss 0.031, col train loss 128.936
epoch 730: avg test  loss 1471.65, bar  test loss 3.175, len  test loss 0.032, col  test loss 132.040


Epoch 731: 272batch [00:30,  9.01batch/s, loss=1.61e+3]


epoch 731: avg train loss 1440.20, bar train loss 2.685, len train loss 0.029, col train loss 128.928


Epoch 732: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 731: avg test  loss 1468.62, bar  test loss 2.742, len  test loss 0.033, col  test loss 130.749


Epoch 732: 272batch [00:30,  9.03batch/s, loss=1.5e+3] 


epoch 732: avg train loss 1442.03, bar train loss 2.701, len train loss 0.030, col train loss 128.827


Epoch 733: 1batch [00:00,  9.35batch/s, loss=1.51e+3]

epoch 732: avg test  loss 1465.26, bar  test loss 2.834, len  test loss 0.032, col  test loss 131.174


Epoch 733: 272batch [00:30,  8.95batch/s, loss=1.47e+3]


epoch 733: avg train loss 1440.48, bar train loss 2.685, len train loss 0.030, col train loss 128.859


Epoch 734: 0batch [00:00, ?batch/s, loss=1.45e+3]

epoch 733: avg test  loss 1468.17, bar  test loss 2.757, len  test loss 0.031, col  test loss 131.326


Epoch 734: 272batch [00:30,  8.99batch/s, loss=1.38e+3]


epoch 734: avg train loss 1441.41, bar train loss 2.693, len train loss 0.029, col train loss 128.882


Epoch 735: 1batch [00:00,  9.52batch/s, loss=1.47e+3]

epoch 734: avg test  loss 1465.93, bar  test loss 2.910, len  test loss 0.032, col  test loss 131.135


Epoch 735: 272batch [00:30,  8.91batch/s, loss=1.52e+3]


epoch 735: avg train loss 1441.08, bar train loss 2.675, len train loss 0.029, col train loss 128.866
epoch 735: avg test  loss 1474.10, bar  test loss 3.625, len  test loss 0.035, col  test loss 131.593


Epoch 736: 272batch [00:30,  8.93batch/s, loss=1.49e+3]


epoch 736: avg train loss 1441.07, bar train loss 2.691, len train loss 0.029, col train loss 128.989


Epoch 737: 1batch [00:00,  9.90batch/s, loss=1.52e+3]

epoch 736: avg test  loss 1464.23, bar  test loss 2.859, len  test loss 0.031, col  test loss 131.265


Epoch 737: 272batch [00:30,  8.99batch/s, loss=1.5e+3] 


epoch 737: avg train loss 1440.30, bar train loss 2.669, len train loss 0.030, col train loss 128.785


Epoch 738: 1batch [00:00,  8.62batch/s, loss=1.43e+3]

epoch 737: avg test  loss 1470.29, bar  test loss 3.029, len  test loss 0.039, col  test loss 131.023


Epoch 738: 272batch [00:30,  8.98batch/s, loss=1.38e+3]


epoch 738: avg train loss 1441.26, bar train loss 2.688, len train loss 0.030, col train loss 128.887


Epoch 739: 0batch [00:00, ?batch/s]

epoch 738: avg test  loss 1462.84, bar  test loss 2.873, len  test loss 0.031, col  test loss 131.361


Epoch 739: 272batch [00:31,  8.76batch/s, loss=1.53e+3]


epoch 739: avg train loss 1443.20, bar train loss 2.695, len train loss 0.030, col train loss 129.025


Epoch 740: 1batch [00:00,  9.62batch/s, loss=1.54e+3]

epoch 739: avg test  loss 1468.63, bar  test loss 2.901, len  test loss 0.032, col  test loss 131.429


Epoch 740: 272batch [00:30,  8.83batch/s, loss=1.55e+3]


epoch 740: avg train loss 1443.02, bar train loss 2.700, len train loss 0.030, col train loss 129.094
epoch 740: avg test  loss 1465.04, bar  test loss 2.823, len  test loss 0.032, col  test loss 131.243


Epoch 741: 272batch [00:30,  8.91batch/s, loss=1.42e+3]


epoch 741: avg train loss 1446.40, bar train loss 2.688, len train loss 0.030, col train loss 129.419


Epoch 742: 1batch [00:00,  9.35batch/s, loss=1.51e+3]

epoch 741: avg test  loss 1466.53, bar  test loss 2.807, len  test loss 0.033, col  test loss 130.926


Epoch 742: 272batch [00:30,  8.93batch/s, loss=1.27e+3]


epoch 742: avg train loss 1444.20, bar train loss 2.696, len train loss 0.030, col train loss 129.353


Epoch 743: 1batch [00:00,  9.90batch/s, loss=1.45e+3]

epoch 742: avg test  loss 1469.74, bar  test loss 3.198, len  test loss 0.032, col  test loss 131.287


Epoch 743: 272batch [00:30,  8.92batch/s, loss=1.38e+3]


epoch 743: avg train loss 1443.58, bar train loss 2.672, len train loss 0.030, col train loss 129.063


Epoch 744: 1batch [00:00,  9.52batch/s, loss=1.43e+3]

epoch 743: avg test  loss 1466.75, bar  test loss 2.854, len  test loss 0.035, col  test loss 131.363


Epoch 744: 272batch [00:30,  8.95batch/s, loss=1.4e+3] 


epoch 744: avg train loss 1446.07, bar train loss 2.707, len train loss 0.031, col train loss 129.467


Epoch 745: 1batch [00:00,  9.35batch/s, loss=1.44e+3]

epoch 744: avg test  loss 1472.84, bar  test loss 3.244, len  test loss 0.034, col  test loss 131.049


Epoch 745: 272batch [00:30,  8.96batch/s, loss=1.46e+3]


epoch 745: avg train loss 1446.41, bar train loss 2.763, len train loss 0.031, col train loss 129.474
epoch 745: avg test  loss 1474.84, bar  test loss 3.013, len  test loss 0.034, col  test loss 132.488


Epoch 746: 272batch [00:30,  8.94batch/s, loss=1.36e+3]


epoch 746: avg train loss 1445.90, bar train loss 2.727, len train loss 0.031, col train loss 129.404


Epoch 747: 1batch [00:00,  9.52batch/s, loss=1.43e+3]

epoch 746: avg test  loss 1473.44, bar  test loss 2.866, len  test loss 0.034, col  test loss 131.974


Epoch 747: 272batch [00:30,  8.92batch/s, loss=1.35e+3]


epoch 747: avg train loss 1445.07, bar train loss 2.674, len train loss 0.030, col train loss 129.291


Epoch 748: 1batch [00:00,  9.80batch/s, loss=1.46e+3]

epoch 747: avg test  loss 1482.97, bar  test loss 3.399, len  test loss 0.032, col  test loss 131.964


Epoch 748: 272batch [00:30,  8.90batch/s, loss=1.36e+3]


epoch 748: avg train loss 1446.89, bar train loss 2.772, len train loss 0.031, col train loss 129.508


Epoch 749: 0batch [00:00, ?batch/s, loss=1.43e+3]

epoch 748: avg test  loss 1468.57, bar  test loss 2.975, len  test loss 0.032, col  test loss 131.428


Epoch 749: 272batch [00:31,  8.77batch/s, loss=1.47e+3]


epoch 749: avg train loss 1444.46, bar train loss 2.679, len train loss 0.029, col train loss 129.177


Epoch 750: 1batch [00:00,  6.90batch/s, loss=1.47e+3]

epoch 749: avg test  loss 1467.44, bar  test loss 2.883, len  test loss 0.033, col  test loss 131.704


Epoch 750: 272batch [00:31,  8.58batch/s, loss=1.47e+3]


epoch 750: avg train loss 1444.31, bar train loss 2.703, len train loss 0.029, col train loss 129.266
epoch 750: avg test  loss 1465.59, bar  test loss 2.808, len  test loss 0.032, col  test loss 131.133


Epoch 751: 272batch [00:30,  8.85batch/s, loss=1.5e+3] 


epoch 751: avg train loss 1444.78, bar train loss 2.723, len train loss 0.030, col train loss 129.223


Epoch 752: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 751: avg test  loss 1469.82, bar  test loss 3.183, len  test loss 0.032, col  test loss 131.704


Epoch 752: 272batch [00:32,  8.46batch/s, loss=1.53e+3]


epoch 752: avg train loss 1446.17, bar train loss 2.718, len train loss 0.029, col train loss 129.514


Epoch 753: 0batch [00:00, ?batch/s]

epoch 752: avg test  loss 1473.00, bar  test loss 2.850, len  test loss 0.030, col  test loss 132.187


Epoch 753: 272batch [00:31,  8.73batch/s, loss=1.38e+3]


epoch 753: avg train loss 1447.60, bar train loss 2.765, len train loss 0.030, col train loss 129.668


Epoch 754: 1batch [00:00,  9.35batch/s, loss=1.46e+3]

epoch 753: avg test  loss 1473.26, bar  test loss 2.918, len  test loss 0.035, col  test loss 132.538


Epoch 754: 272batch [00:31,  8.77batch/s, loss=1.36e+3]


epoch 754: avg train loss 1447.13, bar train loss 2.755, len train loss 0.031, col train loss 129.576


Epoch 755: 1batch [00:00,  8.85batch/s, loss=1.44e+3]

epoch 754: avg test  loss 1471.45, bar  test loss 2.992, len  test loss 0.036, col  test loss 132.504


Epoch 755: 272batch [00:31,  8.73batch/s, loss=1.39e+3]


epoch 755: avg train loss 1446.34, bar train loss 2.742, len train loss 0.031, col train loss 129.416
epoch 755: avg test  loss 1468.62, bar  test loss 2.889, len  test loss 0.033, col  test loss 132.017


Epoch 756: 272batch [00:30,  8.85batch/s, loss=1.4e+3] 


epoch 756: avg train loss 1448.31, bar train loss 2.752, len train loss 0.031, col train loss 129.679


Epoch 757: 1batch [00:00,  9.35batch/s, loss=1.42e+3]

epoch 756: avg test  loss 1470.29, bar  test loss 3.027, len  test loss 0.033, col  test loss 130.987


Epoch 757: 272batch [00:30,  8.83batch/s, loss=1.51e+3]


epoch 757: avg train loss 1448.61, bar train loss 2.755, len train loss 0.030, col train loss 129.719


Epoch 758: 1batch [00:00,  9.71batch/s, loss=1.41e+3]

epoch 757: avg test  loss 1471.64, bar  test loss 3.198, len  test loss 0.033, col  test loss 132.220


Epoch 758: 272batch [00:30,  8.86batch/s, loss=1.46e+3]


epoch 758: avg train loss 1447.64, bar train loss 2.743, len train loss 0.030, col train loss 129.634


Epoch 759: 1batch [00:00,  9.35batch/s, loss=1.44e+3]

epoch 758: avg test  loss 1473.24, bar  test loss 2.834, len  test loss 0.031, col  test loss 131.402


Epoch 759: 272batch [00:30,  8.87batch/s, loss=1.57e+3]


epoch 759: avg train loss 1447.70, bar train loss 2.690, len train loss 0.030, col train loss 129.663


Epoch 760: 1batch [00:00,  9.62batch/s, loss=1.4e+3]

epoch 759: avg test  loss 1467.17, bar  test loss 3.011, len  test loss 0.032, col  test loss 131.426


Epoch 760: 272batch [00:30,  8.83batch/s, loss=1.57e+3]


epoch 760: avg train loss 1447.97, bar train loss 2.736, len train loss 0.030, col train loss 129.558
epoch 760: avg test  loss 1469.89, bar  test loss 2.958, len  test loss 0.033, col  test loss 132.261


Epoch 761: 272batch [00:30,  8.80batch/s, loss=1.51e+3]


epoch 761: avg train loss 1447.68, bar train loss 2.699, len train loss 0.030, col train loss 129.678


Epoch 762: 1batch [00:00, 10.00batch/s, loss=1.46e+3]

epoch 761: avg test  loss 1475.67, bar  test loss 3.111, len  test loss 0.036, col  test loss 132.678


Epoch 762: 272batch [00:30,  8.86batch/s, loss=1.55e+3]


epoch 762: avg train loss 1448.25, bar train loss 2.733, len train loss 0.031, col train loss 129.612


Epoch 763: 1batch [00:00,  9.43batch/s, loss=1.5e+3]

epoch 762: avg test  loss 1465.55, bar  test loss 2.765, len  test loss 0.034, col  test loss 131.281


Epoch 763: 272batch [00:31,  8.71batch/s, loss=1.39e+3]


epoch 763: avg train loss 1449.11, bar train loss 2.731, len train loss 0.030, col train loss 129.800


Epoch 764: 1batch [00:00,  9.43batch/s, loss=1.5e+3]

epoch 763: avg test  loss 1468.40, bar  test loss 2.831, len  test loss 0.034, col  test loss 131.913


Epoch 764: 272batch [00:32,  8.49batch/s, loss=1.36e+3]


epoch 764: avg train loss 1451.10, bar train loss 2.790, len train loss 0.030, col train loss 129.804


Epoch 765: 1batch [00:00,  9.18batch/s, loss=1.43e+3]

epoch 764: avg test  loss 1474.19, bar  test loss 2.862, len  test loss 0.034, col  test loss 132.214


Epoch 765: 272batch [00:31,  8.59batch/s, loss=1.42e+3]


epoch 765: avg train loss 1451.28, bar train loss 2.701, len train loss 0.030, col train loss 129.853
epoch 765: avg test  loss 1473.74, bar  test loss 2.936, len  test loss 0.033, col  test loss 132.026


Epoch 766: 272batch [00:31,  8.69batch/s, loss=1.48e+3]


epoch 766: avg train loss 1452.38, bar train loss 2.732, len train loss 0.032, col train loss 129.970


Epoch 767: 1batch [00:00,  8.77batch/s, loss=1.45e+3]

epoch 766: avg test  loss 1473.13, bar  test loss 2.875, len  test loss 0.034, col  test loss 131.726


Epoch 767: 272batch [00:30,  8.82batch/s, loss=1.5e+3] 


epoch 767: avg train loss 1452.65, bar train loss 2.792, len train loss 0.030, col train loss 130.000


Epoch 768: 1batch [00:00,  9.62batch/s, loss=1.54e+3]

epoch 767: avg test  loss 1479.25, bar  test loss 3.234, len  test loss 0.033, col  test loss 132.417


Epoch 768: 272batch [00:30,  8.81batch/s, loss=1.41e+3]


epoch 768: avg train loss 1451.35, bar train loss 2.719, len train loss 0.031, col train loss 129.926


Epoch 769: 1batch [00:00,  9.26batch/s, loss=1.39e+3]

epoch 768: avg test  loss 1478.44, bar  test loss 3.265, len  test loss 0.033, col  test loss 131.971


Epoch 769: 272batch [00:30,  8.81batch/s, loss=1.37e+3]


epoch 769: avg train loss 1453.57, bar train loss 2.798, len train loss 0.031, col train loss 130.123


Epoch 770: 1batch [00:00,  8.70batch/s, loss=1.48e+3]

epoch 769: avg test  loss 1470.97, bar  test loss 2.822, len  test loss 0.033, col  test loss 131.865


Epoch 770: 272batch [00:30,  8.82batch/s, loss=1.52e+3]


epoch 770: avg train loss 1451.33, bar train loss 2.724, len train loss 0.031, col train loss 129.925
epoch 770: avg test  loss 1474.80, bar  test loss 2.788, len  test loss 0.033, col  test loss 132.681


Epoch 771: 272batch [00:31,  8.68batch/s, loss=1.41e+3]


epoch 771: avg train loss 1453.44, bar train loss 2.778, len train loss 0.031, col train loss 130.119


Epoch 772: 1batch [00:00,  9.35batch/s, loss=1.47e+3]

epoch 771: avg test  loss 1482.46, bar  test loss 3.429, len  test loss 0.035, col  test loss 132.555


Epoch 772: 272batch [00:31,  8.71batch/s, loss=1.38e+3]


epoch 772: avg train loss 1452.58, bar train loss 2.740, len train loss 0.031, col train loss 130.095


Epoch 773: 1batch [00:00,  9.26batch/s, loss=1.36e+3]

epoch 772: avg test  loss 1474.70, bar  test loss 2.862, len  test loss 0.034, col  test loss 131.830


Epoch 773: 272batch [00:31,  8.69batch/s, loss=1.41e+3]


epoch 773: avg train loss 1450.57, bar train loss 2.749, len train loss 0.030, col train loss 129.979


Epoch 774: 1batch [00:00,  9.26batch/s, loss=1.44e+3]

epoch 773: avg test  loss 1475.11, bar  test loss 2.870, len  test loss 0.034, col  test loss 132.233


Epoch 774: 272batch [00:32,  8.37batch/s, loss=1.4e+3] 


epoch 774: avg train loss 1453.47, bar train loss 2.841, len train loss 0.030, col train loss 130.029


Epoch 775: 1batch [00:00,  8.33batch/s, loss=1.42e+3]

epoch 774: avg test  loss 1477.27, bar  test loss 3.187, len  test loss 0.033, col  test loss 131.360


Epoch 775: 272batch [00:31,  8.56batch/s, loss=1.36e+3]


epoch 775: avg train loss 1452.01, bar train loss 2.727, len train loss 0.030, col train loss 130.003
epoch 775: avg test  loss 1478.47, bar  test loss 2.804, len  test loss 0.035, col  test loss 132.651


Epoch 776: 272batch [00:30,  8.79batch/s, loss=1.45e+3]


epoch 776: avg train loss 1453.85, bar train loss 2.725, len train loss 0.030, col train loss 130.303


Epoch 777: 1batch [00:00,  9.35batch/s, loss=1.48e+3]

epoch 776: avg test  loss 1476.22, bar  test loss 2.885, len  test loss 0.034, col  test loss 132.388


Epoch 777: 272batch [00:31,  8.57batch/s, loss=1.45e+3]


epoch 777: avg train loss 1454.11, bar train loss 2.775, len train loss 0.030, col train loss 130.220


Epoch 778: 1batch [00:00,  8.77batch/s, loss=1.5e+3]

epoch 777: avg test  loss 1474.95, bar  test loss 2.816, len  test loss 0.036, col  test loss 132.193


Epoch 778: 272batch [00:31,  8.62batch/s, loss=1.48e+3]


epoch 778: avg train loss 1456.07, bar train loss 2.795, len train loss 0.033, col train loss 130.615


Epoch 779: 1batch [00:00,  9.17batch/s, loss=1.54e+3]

epoch 778: avg test  loss 1478.33, bar  test loss 3.296, len  test loss 0.032, col  test loss 132.565


Epoch 779: 272batch [00:31,  8.77batch/s, loss=1.56e+3]


epoch 779: avg train loss 1452.61, bar train loss 2.766, len train loss 0.029, col train loss 130.147


Epoch 780: 1batch [00:00,  9.80batch/s, loss=1.5e+3]

epoch 779: avg test  loss 1475.60, bar  test loss 2.870, len  test loss 0.031, col  test loss 132.113


Epoch 780: 272batch [00:31,  8.71batch/s, loss=1.42e+3]


epoch 780: avg train loss 1454.66, bar train loss 2.791, len train loss 0.030, col train loss 130.227
epoch 780: avg test  loss 1475.63, bar  test loss 2.845, len  test loss 0.035, col  test loss 132.349


Epoch 781: 272batch [00:31,  8.67batch/s, loss=1.54e+3]


epoch 781: avg train loss 1452.61, bar train loss 2.761, len train loss 0.030, col train loss 130.049


Epoch 782: 1batch [00:00, 10.00batch/s, loss=1.44e+3]

epoch 781: avg test  loss 1475.16, bar  test loss 2.906, len  test loss 0.032, col  test loss 131.980


Epoch 782: 272batch [00:31,  8.75batch/s, loss=1.53e+3]


epoch 782: avg train loss 1456.39, bar train loss 2.781, len train loss 0.031, col train loss 130.549


Epoch 783: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 782: avg test  loss 1477.67, bar  test loss 2.949, len  test loss 0.032, col  test loss 132.962


Epoch 783: 272batch [00:31,  8.72batch/s, loss=1.47e+3]


epoch 783: avg train loss 1455.98, bar train loss 2.741, len train loss 0.030, col train loss 130.412


Epoch 784: 1batch [00:00,  9.52batch/s, loss=1.46e+3]

epoch 783: avg test  loss 1478.54, bar  test loss 2.896, len  test loss 0.034, col  test loss 132.341


Epoch 784: 272batch [00:31,  8.71batch/s, loss=1.44e+3]


epoch 784: avg train loss 1457.26, bar train loss 2.758, len train loss 0.031, col train loss 130.525


Epoch 785: 1batch [00:00,  9.70batch/s, loss=1.4e+3]

epoch 784: avg test  loss 1479.35, bar  test loss 2.954, len  test loss 0.035, col  test loss 132.491


Epoch 785: 272batch [00:31,  8.76batch/s, loss=1.43e+3]


epoch 785: avg train loss 1456.45, bar train loss 2.819, len train loss 0.032, col train loss 130.659
epoch 785: avg test  loss 1481.05, bar  test loss 2.960, len  test loss 0.032, col  test loss 133.146


Epoch 786: 272batch [00:31,  8.50batch/s, loss=1.37e+3]


epoch 786: avg train loss 1454.75, bar train loss 2.781, len train loss 0.031, col train loss 130.201


Epoch 787: 1batch [00:00,  9.35batch/s, loss=1.41e+3]

epoch 786: avg test  loss 1481.65, bar  test loss 3.330, len  test loss 0.034, col  test loss 131.473


Epoch 787: 272batch [00:31,  8.63batch/s, loss=1.5e+3] 


epoch 787: avg train loss 1454.05, bar train loss 2.768, len train loss 0.031, col train loss 130.284


Epoch 788: 1batch [00:00,  9.43batch/s, loss=1.44e+3]

epoch 787: avg test  loss 1474.99, bar  test loss 2.864, len  test loss 0.034, col  test loss 132.447


Epoch 788: 272batch [00:31,  8.70batch/s, loss=1.46e+3]


epoch 788: avg train loss 1453.63, bar train loss 2.772, len train loss 0.031, col train loss 130.177


Epoch 789: 1batch [00:00,  9.01batch/s, loss=1.48e+3]

epoch 788: avg test  loss 1483.19, bar  test loss 3.490, len  test loss 0.034, col  test loss 132.581


Epoch 789: 272batch [00:31,  8.65batch/s, loss=1.56e+3]


epoch 789: avg train loss 1455.56, bar train loss 2.848, len train loss 0.031, col train loss 130.303


Epoch 790: 1batch [00:00,  9.35batch/s, loss=1.47e+3]

epoch 789: avg test  loss 1477.78, bar  test loss 3.059, len  test loss 0.033, col  test loss 132.348


Epoch 790: 272batch [00:31,  8.68batch/s, loss=1.57e+3]


epoch 790: avg train loss 1456.41, bar train loss 2.790, len train loss 0.031, col train loss 130.468
epoch 790: avg test  loss 1484.38, bar  test loss 3.137, len  test loss 0.038, col  test loss 132.942


Epoch 791: 272batch [00:31,  8.68batch/s, loss=1.35e+3]


epoch 791: avg train loss 1458.40, bar train loss 2.808, len train loss 0.031, col train loss 130.644


Epoch 792: 1batch [00:00,  9.17batch/s, loss=1.42e+3]

epoch 791: avg test  loss 1478.23, bar  test loss 3.054, len  test loss 0.033, col  test loss 133.057


Epoch 792: 272batch [00:31,  8.70batch/s, loss=1.33e+3]


epoch 792: avg train loss 1455.15, bar train loss 2.798, len train loss 0.031, col train loss 130.453


Epoch 793: 1batch [00:00,  9.26batch/s, loss=1.48e+3]

epoch 792: avg test  loss 1501.51, bar  test loss 4.625, len  test loss 0.034, col  test loss 133.076


Epoch 793: 272batch [00:31,  8.71batch/s, loss=1.44e+3]


epoch 793: avg train loss 1457.68, bar train loss 3.022, len train loss 0.030, col train loss 130.620


Epoch 794: 1batch [00:00,  8.70batch/s, loss=1.41e+3]

epoch 793: avg test  loss 1480.73, bar  test loss 2.977, len  test loss 0.038, col  test loss 132.569


Epoch 794: 272batch [00:31,  8.69batch/s, loss=1.53e+3]


epoch 794: avg train loss 1459.24, bar train loss 2.796, len train loss 0.032, col train loss 130.684


Epoch 795: 1batch [00:00,  9.62batch/s, loss=1.45e+3]

epoch 794: avg test  loss 1481.52, bar  test loss 3.384, len  test loss 0.033, col  test loss 132.493


Epoch 795: 272batch [00:31,  8.67batch/s, loss=1.51e+3]


epoch 795: avg train loss 1457.93, bar train loss 2.731, len train loss 0.030, col train loss 130.580
epoch 795: avg test  loss 1479.90, bar  test loss 3.062, len  test loss 0.032, col  test loss 133.020


Epoch 796: 272batch [00:31,  8.67batch/s, loss=1.43e+3]


epoch 796: avg train loss 1457.18, bar train loss 2.763, len train loss 0.032, col train loss 130.669


Epoch 797: 1batch [00:00,  9.62batch/s, loss=1.52e+3]

epoch 796: avg test  loss 1479.12, bar  test loss 3.098, len  test loss 0.034, col  test loss 132.545


Epoch 797: 272batch [00:31,  8.57batch/s, loss=1.64e+3]


epoch 797: avg train loss 1457.21, bar train loss 2.826, len train loss 0.030, col train loss 130.620


Epoch 798: 1batch [00:00,  9.52batch/s, loss=1.41e+3]

epoch 797: avg test  loss 1484.76, bar  test loss 3.166, len  test loss 0.032, col  test loss 132.745


Epoch 798: 272batch [00:33,  8.12batch/s, loss=1.49e+3]


epoch 798: avg train loss 1458.71, bar train loss 2.826, len train loss 0.031, col train loss 130.644


Epoch 799: 1batch [00:00,  8.85batch/s, loss=1.44e+3]

epoch 798: avg test  loss 1482.19, bar  test loss 3.204, len  test loss 0.035, col  test loss 133.019


Epoch 799: 272batch [00:31,  8.57batch/s, loss=1.57e+3]


epoch 799: avg train loss 1457.44, bar train loss 2.827, len train loss 0.032, col train loss 130.668


Epoch 800: 1batch [00:00,  8.70batch/s, loss=1.43e+3]

epoch 799: avg test  loss 1475.38, bar  test loss 3.065, len  test loss 0.034, col  test loss 132.268


Epoch 800: 272batch [00:31,  8.63batch/s, loss=1.45e+3]


epoch 800: avg train loss 1458.21, bar train loss 2.810, len train loss 0.031, col train loss 130.703
epoch 800: avg test  loss 1479.09, bar  test loss 3.021, len  test loss 0.035, col  test loss 133.192


Epoch 801: 272batch [00:31,  8.64batch/s, loss=1.43e+3]


epoch 801: avg train loss 1459.15, bar train loss 2.862, len train loss 0.033, col train loss 130.788


Epoch 802: 1batch [00:00,  8.77batch/s, loss=1.43e+3]

epoch 801: avg test  loss 1483.35, bar  test loss 3.117, len  test loss 0.035, col  test loss 132.938


Epoch 802: 272batch [00:31,  8.65batch/s, loss=1.41e+3]


epoch 802: avg train loss 1457.72, bar train loss 2.816, len train loss 0.032, col train loss 130.637


Epoch 803: 1batch [00:00,  8.55batch/s, loss=1.46e+3]

epoch 802: avg test  loss 1481.21, bar  test loss 3.123, len  test loss 0.034, col  test loss 133.025


Epoch 803: 272batch [00:31,  8.64batch/s, loss=1.45e+3]


epoch 803: avg train loss 1458.02, bar train loss 2.801, len train loss 0.031, col train loss 130.744


Epoch 804: 1batch [00:00,  9.35batch/s, loss=1.43e+3]

epoch 803: avg test  loss 1484.80, bar  test loss 2.982, len  test loss 0.035, col  test loss 133.931


Epoch 804: 272batch [00:31,  8.61batch/s, loss=1.47e+3]


epoch 804: avg train loss 1461.86, bar train loss 2.877, len train loss 0.032, col train loss 130.949


Epoch 805: 1batch [00:00,  9.35batch/s, loss=1.46e+3]

epoch 804: avg test  loss 1494.43, bar  test loss 4.321, len  test loss 0.033, col  test loss 132.808


Epoch 805: 272batch [00:31,  8.57batch/s, loss=1.45e+3]


epoch 805: avg train loss 1459.91, bar train loss 2.879, len train loss 0.030, col train loss 130.745
epoch 805: avg test  loss 1484.47, bar  test loss 3.243, len  test loss 0.034, col  test loss 133.468


Epoch 806: 272batch [00:32,  8.49batch/s, loss=1.45e+3]


epoch 806: avg train loss 1457.26, bar train loss 2.824, len train loss 0.030, col train loss 130.687


Epoch 807: 1batch [00:00,  9.26batch/s, loss=1.46e+3]

epoch 806: avg test  loss 1486.72, bar  test loss 3.125, len  test loss 0.036, col  test loss 134.045


Epoch 807: 272batch [00:32,  8.49batch/s, loss=1.4e+3] 


epoch 807: avg train loss 1459.16, bar train loss 2.813, len train loss 0.031, col train loss 130.496


Epoch 808: 1batch [00:00,  9.17batch/s, loss=1.44e+3]

epoch 807: avg test  loss 1480.99, bar  test loss 3.078, len  test loss 0.036, col  test loss 132.803


Epoch 808: 272batch [00:31,  8.55batch/s, loss=1.34e+3]


epoch 808: avg train loss 1459.54, bar train loss 2.847, len train loss 0.030, col train loss 130.758


Epoch 809: 1batch [00:00,  8.85batch/s, loss=1.51e+3]

epoch 808: avg test  loss 1482.06, bar  test loss 3.015, len  test loss 0.033, col  test loss 133.284


Epoch 809: 272batch [00:31,  8.55batch/s, loss=1.6e+3] 


epoch 809: avg train loss 1464.03, bar train loss 2.878, len train loss 0.032, col train loss 131.139


Epoch 810: 1batch [00:00,  9.90batch/s, loss=1.48e+3]

epoch 809: avg test  loss 1487.70, bar  test loss 3.449, len  test loss 0.038, col  test loss 133.242


Epoch 810: 272batch [00:31,  8.61batch/s, loss=1.45e+3]


epoch 810: avg train loss 1461.84, bar train loss 2.824, len train loss 0.031, col train loss 131.119
epoch 810: avg test  loss 1487.02, bar  test loss 2.966, len  test loss 0.037, col  test loss 133.409


Epoch 811: 272batch [00:31,  8.60batch/s, loss=1.48e+3]


epoch 811: avg train loss 1462.95, bar train loss 2.839, len train loss 0.031, col train loss 131.290


Epoch 812: 1batch [00:00,  9.35batch/s, loss=1.48e+3]

epoch 811: avg test  loss 1480.49, bar  test loss 3.029, len  test loss 0.031, col  test loss 132.457


Epoch 812: 272batch [00:31,  8.56batch/s, loss=1.65e+3]


epoch 812: avg train loss 1464.98, bar train loss 2.813, len train loss 0.031, col train loss 131.388


Epoch 813: 1batch [00:00,  9.01batch/s, loss=1.55e+3]

epoch 812: avg test  loss 1484.78, bar  test loss 3.069, len  test loss 0.037, col  test loss 132.611


Epoch 813: 272batch [00:31,  8.51batch/s, loss=1.44e+3]


epoch 813: avg train loss 1466.01, bar train loss 2.916, len train loss 0.032, col train loss 131.514


Epoch 814: 1batch [00:00,  9.35batch/s, loss=1.46e+3]

epoch 813: avg test  loss 1483.73, bar  test loss 2.911, len  test loss 0.034, col  test loss 133.180


Epoch 814: 272batch [00:31,  8.59batch/s, loss=1.71e+3]


epoch 814: avg train loss 1462.01, bar train loss 2.764, len train loss 0.031, col train loss 131.069


Epoch 815: 1batch [00:00,  9.01batch/s, loss=1.43e+3]

epoch 814: avg test  loss 1487.42, bar  test loss 3.396, len  test loss 0.035, col  test loss 133.100


Epoch 815: 272batch [00:31,  8.59batch/s, loss=1.61e+3]


epoch 815: avg train loss 1461.44, bar train loss 2.838, len train loss 0.031, col train loss 130.955
epoch 815: avg test  loss 1484.84, bar  test loss 2.948, len  test loss 0.034, col  test loss 133.227


Epoch 816: 272batch [00:31,  8.56batch/s, loss=1.6e+3] 


epoch 816: avg train loss 1462.28, bar train loss 2.821, len train loss 0.031, col train loss 131.103


Epoch 817: 1batch [00:00,  9.43batch/s, loss=1.54e+3]

epoch 816: avg test  loss 1494.32, bar  test loss 4.047, len  test loss 0.032, col  test loss 133.026


Epoch 817: 272batch [00:31,  8.60batch/s, loss=1.56e+3]


epoch 817: avg train loss 1463.77, bar train loss 2.904, len train loss 0.030, col train loss 131.259


Epoch 818: 1batch [00:00,  9.62batch/s, loss=1.49e+3]

epoch 817: avg test  loss 1484.92, bar  test loss 2.971, len  test loss 0.032, col  test loss 133.035


Epoch 818: 272batch [00:31,  8.62batch/s, loss=1.34e+3]


epoch 818: avg train loss 1462.47, bar train loss 2.856, len train loss 0.031, col train loss 131.240


Epoch 819: 1batch [00:00,  8.93batch/s, loss=1.4e+3]

epoch 818: avg test  loss 1477.76, bar  test loss 2.967, len  test loss 0.034, col  test loss 132.910


Epoch 819: 272batch [00:31,  8.55batch/s, loss=1.58e+3]


epoch 819: avg train loss 1463.90, bar train loss 2.915, len train loss 0.032, col train loss 131.245


Epoch 820: 1batch [00:00,  9.26batch/s, loss=1.5e+3]

epoch 819: avg test  loss 1495.22, bar  test loss 3.084, len  test loss 0.033, col  test loss 134.211


Epoch 820: 272batch [00:31,  8.56batch/s, loss=1.57e+3]


epoch 820: avg train loss 1466.57, bar train loss 2.861, len train loss 0.032, col train loss 131.436
epoch 820: avg test  loss 1491.05, bar  test loss 3.306, len  test loss 0.036, col  test loss 133.281


Epoch 821: 272batch [00:31,  8.53batch/s, loss=1.5e+3] 


epoch 821: avg train loss 1464.87, bar train loss 2.933, len train loss 0.031, col train loss 131.205


Epoch 822: 1batch [00:00,  9.52batch/s, loss=1.41e+3]

epoch 821: avg test  loss 1489.87, bar  test loss 3.310, len  test loss 0.033, col  test loss 133.657


Epoch 822: 272batch [00:32,  8.49batch/s, loss=1.5e+3] 


epoch 822: avg train loss 1466.23, bar train loss 2.929, len train loss 0.031, col train loss 131.494


Epoch 823: 1batch [00:00,  9.62batch/s, loss=1.48e+3]

epoch 822: avg test  loss 1487.97, bar  test loss 3.164, len  test loss 0.035, col  test loss 134.630


Epoch 823: 272batch [00:32,  8.30batch/s, loss=1.42e+3]


epoch 823: avg train loss 1464.57, bar train loss 2.826, len train loss 0.031, col train loss 131.428


Epoch 824: 1batch [00:00,  9.43batch/s, loss=1.44e+3]

epoch 823: avg test  loss 1484.94, bar  test loss 3.299, len  test loss 0.033, col  test loss 133.231


Epoch 824: 272batch [00:32,  8.34batch/s, loss=1.5e+3] 


epoch 824: avg train loss 1463.34, bar train loss 2.882, len train loss 0.031, col train loss 131.268


Epoch 825: 1batch [00:00,  8.77batch/s, loss=1.46e+3]

epoch 824: avg test  loss 1487.51, bar  test loss 2.900, len  test loss 0.034, col  test loss 133.144


Epoch 825: 272batch [00:32,  8.36batch/s, loss=1.52e+3]


epoch 825: avg train loss 1465.22, bar train loss 2.815, len train loss 0.031, col train loss 131.379
epoch 825: avg test  loss 1482.61, bar  test loss 3.021, len  test loss 0.034, col  test loss 132.915


Epoch 826: 272batch [00:32,  8.46batch/s, loss=1.44e+3]


epoch 826: avg train loss 1465.85, bar train loss 2.964, len train loss 0.032, col train loss 131.117


Epoch 827: 1batch [00:00,  9.01batch/s, loss=1.47e+3]

epoch 826: avg test  loss 1486.79, bar  test loss 3.201, len  test loss 0.034, col  test loss 133.711


Epoch 827: 272batch [00:31,  8.53batch/s, loss=1.44e+3]


epoch 827: avg train loss 1467.27, bar train loss 2.871, len train loss 0.032, col train loss 131.525


Epoch 828: 1batch [00:00,  8.93batch/s, loss=1.47e+3]

epoch 827: avg test  loss 1487.12, bar  test loss 3.238, len  test loss 0.033, col  test loss 133.244


Epoch 828: 272batch [00:31,  8.51batch/s, loss=1.37e+3]


epoch 828: avg train loss 1465.91, bar train loss 2.912, len train loss 0.032, col train loss 131.225


Epoch 829: 1batch [00:00,  8.93batch/s, loss=1.48e+3]

epoch 828: avg test  loss 1486.41, bar  test loss 2.902, len  test loss 0.041, col  test loss 133.151


Epoch 829: 272batch [00:32,  8.43batch/s, loss=1.45e+3]


epoch 829: avg train loss 1467.59, bar train loss 2.873, len train loss 0.031, col train loss 131.426


Epoch 830: 1batch [00:00,  8.85batch/s, loss=1.46e+3]

epoch 829: avg test  loss 1499.43, bar  test loss 3.839, len  test loss 0.033, col  test loss 133.231


Epoch 830: 272batch [00:31,  8.53batch/s, loss=1.33e+3]


epoch 830: avg train loss 1467.66, bar train loss 2.975, len train loss 0.033, col train loss 131.462
epoch 830: avg test  loss 1491.90, bar  test loss 3.511, len  test loss 0.035, col  test loss 133.138


Epoch 831: 272batch [00:32,  8.49batch/s, loss=1.55e+3]


epoch 831: avg train loss 1468.09, bar train loss 2.946, len train loss 0.032, col train loss 131.637


Epoch 832: 1batch [00:00,  8.70batch/s, loss=1.49e+3]

epoch 831: avg test  loss 1488.81, bar  test loss 2.972, len  test loss 0.034, col  test loss 134.006


Epoch 832: 272batch [00:32,  8.31batch/s, loss=1.52e+3]


epoch 832: avg train loss 1465.98, bar train loss 2.912, len train loss 0.031, col train loss 131.392


Epoch 833: 1batch [00:00,  9.71batch/s, loss=1.52e+3]

epoch 832: avg test  loss 1498.22, bar  test loss 4.252, len  test loss 0.032, col  test loss 133.706


Epoch 833: 272batch [00:31,  8.53batch/s, loss=1.57e+3]


epoch 833: avg train loss 1466.97, bar train loss 2.883, len train loss 0.031, col train loss 131.418


Epoch 834: 1batch [00:00,  8.00batch/s, loss=1.46e+3]

epoch 833: avg test  loss 1496.78, bar  test loss 3.378, len  test loss 0.035, col  test loss 132.696


Epoch 834: 272batch [00:32,  8.47batch/s, loss=1.39e+3]


epoch 834: avg train loss 1466.54, bar train loss 2.919, len train loss 0.031, col train loss 131.468


Epoch 835: 1batch [00:00,  9.80batch/s, loss=1.42e+3]

epoch 834: avg test  loss 1488.86, bar  test loss 3.167, len  test loss 0.036, col  test loss 133.814


Epoch 835: 272batch [00:31,  8.53batch/s, loss=1.42e+3]


epoch 835: avg train loss 1467.69, bar train loss 2.933, len train loss 0.031, col train loss 131.590
epoch 835: avg test  loss 1489.52, bar  test loss 3.059, len  test loss 0.033, col  test loss 133.709


Epoch 836: 272batch [00:32,  8.43batch/s, loss=1.36e+3]


epoch 836: avg train loss 1470.38, bar train loss 2.979, len train loss 0.034, col train loss 131.726


Epoch 837: 1batch [00:00,  9.17batch/s, loss=1.42e+3]

epoch 836: avg test  loss 1489.32, bar  test loss 3.426, len  test loss 0.033, col  test loss 133.560


Epoch 837: 272batch [00:32,  8.46batch/s, loss=1.45e+3]


epoch 837: avg train loss 1468.29, bar train loss 2.896, len train loss 0.031, col train loss 131.665


Epoch 838: 1batch [00:00,  9.09batch/s, loss=1.44e+3]

epoch 837: avg test  loss 1486.75, bar  test loss 3.158, len  test loss 0.034, col  test loss 132.421


Epoch 838: 272batch [00:32,  8.44batch/s, loss=1.52e+3]


epoch 838: avg train loss 1465.73, bar train loss 2.876, len train loss 0.031, col train loss 131.401


Epoch 839: 1batch [00:00,  8.55batch/s, loss=1.44e+3]

epoch 838: avg test  loss 1487.46, bar  test loss 3.475, len  test loss 0.036, col  test loss 133.061


Epoch 839: 272batch [00:32,  8.47batch/s, loss=1.45e+3]


epoch 839: avg train loss 1467.33, bar train loss 2.903, len train loss 0.032, col train loss 131.635


Epoch 840: 1batch [00:00,  8.77batch/s, loss=1.54e+3]

epoch 839: avg test  loss 1492.83, bar  test loss 3.413, len  test loss 0.033, col  test loss 133.995


Epoch 840: 272batch [00:32,  8.42batch/s, loss=1.64e+3]


epoch 840: avg train loss 1468.19, bar train loss 2.906, len train loss 0.032, col train loss 131.600
epoch 840: avg test  loss 1492.34, bar  test loss 3.388, len  test loss 0.034, col  test loss 133.912


Epoch 841: 272batch [00:32,  8.40batch/s, loss=1.82e+3]


epoch 841: avg train loss 1470.02, bar train loss 2.960, len train loss 0.031, col train loss 131.813


Epoch 842: 1batch [00:00,  9.71batch/s, loss=1.51e+3]

epoch 841: avg test  loss 1487.55, bar  test loss 3.192, len  test loss 0.033, col  test loss 133.930


Epoch 842: 272batch [00:32,  8.40batch/s, loss=1.47e+3]


epoch 842: avg train loss 1469.41, bar train loss 2.909, len train loss 0.031, col train loss 131.755


Epoch 843: 1batch [00:00,  7.94batch/s, loss=1.42e+3]

epoch 842: avg test  loss 1490.87, bar  test loss 3.067, len  test loss 0.036, col  test loss 134.087


Epoch 843: 272batch [00:32,  8.38batch/s, loss=1.38e+3]


epoch 843: avg train loss 1468.17, bar train loss 2.873, len train loss 0.031, col train loss 131.598


Epoch 844: 1batch [00:00,  8.33batch/s, loss=1.4e+3]

epoch 843: avg test  loss 1491.68, bar  test loss 3.348, len  test loss 0.035, col  test loss 133.831


Epoch 844: 272batch [00:32,  8.36batch/s, loss=1.36e+3]


epoch 844: avg train loss 1469.32, bar train loss 2.904, len train loss 0.032, col train loss 131.749


Epoch 845: 1batch [00:00,  9.35batch/s, loss=1.42e+3]

epoch 844: avg test  loss 1493.38, bar  test loss 3.065, len  test loss 0.038, col  test loss 134.503


Epoch 845: 272batch [00:32,  8.33batch/s, loss=1.41e+3]


epoch 845: avg train loss 1472.53, bar train loss 3.031, len train loss 0.032, col train loss 132.047
epoch 845: avg test  loss 1489.14, bar  test loss 2.967, len  test loss 0.032, col  test loss 133.915


Epoch 846: 272batch [00:33,  8.24batch/s, loss=1.41e+3]


epoch 846: avg train loss 1470.26, bar train loss 2.930, len train loss 0.032, col train loss 131.899


Epoch 847: 1batch [00:00,  9.26batch/s, loss=1.52e+3]

epoch 846: avg test  loss 1502.82, bar  test loss 4.350, len  test loss 0.036, col  test loss 134.077


Epoch 847: 272batch [00:32,  8.28batch/s, loss=1.53e+3]


epoch 847: avg train loss 1471.80, bar train loss 2.958, len train loss 0.032, col train loss 132.144


Epoch 848: 1batch [00:00,  8.47batch/s, loss=1.44e+3]

epoch 847: avg test  loss 1490.84, bar  test loss 3.207, len  test loss 0.037, col  test loss 134.012


Epoch 848: 272batch [00:32,  8.37batch/s, loss=1.46e+3]


epoch 848: avg train loss 1470.86, bar train loss 2.918, len train loss 0.031, col train loss 131.805


Epoch 849: 1batch [00:00,  9.01batch/s, loss=1.46e+3]

epoch 848: avg test  loss 1495.55, bar  test loss 3.468, len  test loss 0.035, col  test loss 134.780


Epoch 849: 272batch [00:32,  8.37batch/s, loss=1.45e+3]


epoch 849: avg train loss 1471.59, bar train loss 2.919, len train loss 0.032, col train loss 132.206


Epoch 850: 1batch [00:00,  9.52batch/s, loss=1.45e+3]

epoch 849: avg test  loss 1492.99, bar  test loss 3.189, len  test loss 0.037, col  test loss 133.661


Epoch 850: 272batch [00:32,  8.42batch/s, loss=1.45e+3]


epoch 850: avg train loss 1473.02, bar train loss 3.130, len train loss 0.032, col train loss 132.196
epoch 850: avg test  loss 1488.81, bar  test loss 3.025, len  test loss 0.035, col  test loss 134.034


Epoch 851: 272batch [00:32,  8.30batch/s, loss=1.43e+3]


epoch 851: avg train loss 1469.79, bar train loss 2.908, len train loss 0.031, col train loss 131.838


Epoch 852: 1batch [00:00,  8.85batch/s, loss=1.38e+3]

epoch 851: avg test  loss 1485.52, bar  test loss 3.044, len  test loss 0.034, col  test loss 133.505


Epoch 852: 272batch [00:32,  8.33batch/s, loss=1.62e+3]


epoch 852: avg train loss 1469.34, bar train loss 2.907, len train loss 0.032, col train loss 132.039


Epoch 853: 1batch [00:00,  8.85batch/s, loss=1.54e+3]

epoch 852: avg test  loss 1494.61, bar  test loss 3.284, len  test loss 0.043, col  test loss 134.678


Epoch 853: 272batch [00:32,  8.28batch/s, loss=1.57e+3]


epoch 853: avg train loss 1473.32, bar train loss 2.945, len train loss 0.033, col train loss 132.134


Epoch 854: 1batch [00:00,  8.40batch/s, loss=1.47e+3]

epoch 853: avg test  loss 1495.34, bar  test loss 3.154, len  test loss 0.036, col  test loss 133.295


Epoch 854: 272batch [00:32,  8.34batch/s, loss=1.44e+3]


epoch 854: avg train loss 1471.47, bar train loss 2.967, len train loss 0.032, col train loss 131.653


Epoch 855: 1batch [00:00,  9.09batch/s, loss=1.47e+3]

epoch 854: avg test  loss 1496.27, bar  test loss 3.504, len  test loss 0.035, col  test loss 133.602


Epoch 855: 272batch [00:32,  8.39batch/s, loss=1.52e+3]


epoch 855: avg train loss 1473.60, bar train loss 3.021, len train loss 0.032, col train loss 132.161
epoch 855: avg test  loss 1493.80, bar  test loss 3.246, len  test loss 0.036, col  test loss 134.565


Epoch 856: 272batch [00:32,  8.38batch/s, loss=1.44e+3]


epoch 856: avg train loss 1472.63, bar train loss 2.913, len train loss 0.033, col train loss 131.996


Epoch 857: 1batch [00:00,  9.09batch/s, loss=1.47e+3]

epoch 856: avg test  loss 1492.78, bar  test loss 3.166, len  test loss 0.033, col  test loss 133.609


Epoch 857: 272batch [00:32,  8.31batch/s, loss=1.52e+3]


epoch 857: avg train loss 1471.95, bar train loss 2.913, len train loss 0.032, col train loss 132.026


Epoch 858: 1batch [00:00,  8.62batch/s, loss=1.42e+3]

epoch 857: avg test  loss 1495.38, bar  test loss 3.863, len  test loss 0.034, col  test loss 133.444


Epoch 858: 272batch [00:32,  8.34batch/s, loss=1.68e+3]


epoch 858: avg train loss 1478.08, bar train loss 3.011, len train loss 0.033, col train loss 132.611


Epoch 859: 1batch [00:00,  8.47batch/s, loss=1.45e+3]

epoch 858: avg test  loss 1500.01, bar  test loss 3.756, len  test loss 0.033, col  test loss 134.151


Epoch 859: 272batch [00:32,  8.31batch/s, loss=1.53e+3]


epoch 859: avg train loss 1473.06, bar train loss 2.912, len train loss 0.030, col train loss 132.158


Epoch 860: 1batch [00:00,  8.26batch/s, loss=1.51e+3]

epoch 859: avg test  loss 1503.99, bar  test loss 4.416, len  test loss 0.034, col  test loss 133.683


Epoch 860: 272batch [00:32,  8.35batch/s, loss=1.43e+3]


epoch 860: avg train loss 1475.51, bar train loss 3.103, len train loss 0.032, col train loss 132.212
epoch 860: avg test  loss 1495.51, bar  test loss 3.384, len  test loss 0.033, col  test loss 133.801


Epoch 861: 272batch [00:32,  8.29batch/s, loss=1.3e+3] 


epoch 861: avg train loss 1475.92, bar train loss 2.954, len train loss 0.034, col train loss 132.355


Epoch 862: 1batch [00:00,  8.47batch/s, loss=1.44e+3]

epoch 861: avg test  loss 1490.48, bar  test loss 2.995, len  test loss 0.035, col  test loss 133.466


Epoch 862: 272batch [00:32,  8.32batch/s, loss=1.49e+3]


epoch 862: avg train loss 1472.26, bar train loss 2.914, len train loss 0.033, col train loss 132.223


Epoch 863: 1batch [00:00,  8.85batch/s, loss=1.5e+3]

epoch 862: avg test  loss 1492.84, bar  test loss 3.514, len  test loss 0.034, col  test loss 133.737


Epoch 863: 272batch [00:32,  8.33batch/s, loss=1.57e+3]


epoch 863: avg train loss 1474.56, bar train loss 3.039, len train loss 0.032, col train loss 132.245


Epoch 864: 1batch [00:00,  8.70batch/s, loss=1.52e+3]

epoch 863: avg test  loss 1493.15, bar  test loss 3.079, len  test loss 0.034, col  test loss 134.393


Epoch 864: 272batch [00:32,  8.34batch/s, loss=1.47e+3]


epoch 864: avg train loss 1477.68, bar train loss 2.953, len train loss 0.033, col train loss 132.776


Epoch 865: 1batch [00:00,  8.85batch/s, loss=1.43e+3]

epoch 864: avg test  loss 1502.20, bar  test loss 3.183, len  test loss 0.039, col  test loss 135.646


Epoch 865: 272batch [00:32,  8.28batch/s, loss=1.38e+3]


epoch 865: avg train loss 1476.02, bar train loss 2.991, len train loss 0.032, col train loss 132.426
epoch 865: avg test  loss 1506.68, bar  test loss 4.145, len  test loss 0.034, col  test loss 134.947


Epoch 866: 272batch [00:32,  8.36batch/s, loss=1.4e+3] 


epoch 866: avg train loss 1476.91, bar train loss 3.023, len train loss 0.033, col train loss 132.415


Epoch 867: 1batch [00:00,  8.85batch/s, loss=1.5e+3]

epoch 866: avg test  loss 1500.98, bar  test loss 3.840, len  test loss 0.037, col  test loss 134.194


Epoch 867: 272batch [00:32,  8.29batch/s, loss=1.47e+3]


epoch 867: avg train loss 1477.76, bar train loss 3.056, len train loss 0.034, col train loss 132.671


Epoch 868: 1batch [00:00,  8.33batch/s, loss=1.43e+3]

epoch 867: avg test  loss 1494.69, bar  test loss 3.233, len  test loss 0.035, col  test loss 134.502


Epoch 868: 272batch [00:32,  8.33batch/s, loss=1.33e+3]


epoch 868: avg train loss 1474.02, bar train loss 2.890, len train loss 0.032, col train loss 132.198


Epoch 869: 1batch [00:00,  9.90batch/s, loss=1.39e+3]

epoch 868: avg test  loss 1493.47, bar  test loss 3.174, len  test loss 0.035, col  test loss 133.465


Epoch 869: 272batch [00:32,  8.25batch/s, loss=1.41e+3]


epoch 869: avg train loss 1476.59, bar train loss 3.027, len train loss 0.033, col train loss 132.627


Epoch 870: 0batch [00:00, ?batch/s, loss=1.41e+3]

epoch 869: avg test  loss 1495.80, bar  test loss 3.226, len  test loss 0.035, col  test loss 134.509


Epoch 870: 272batch [00:33,  8.20batch/s, loss=1.45e+3]


epoch 870: avg train loss 1477.81, bar train loss 2.977, len train loss 0.033, col train loss 132.547
epoch 870: avg test  loss 1501.24, bar  test loss 3.407, len  test loss 0.037, col  test loss 135.347


Epoch 871: 272batch [00:33,  8.21batch/s, loss=1.43e+3]


epoch 871: avg train loss 1477.82, bar train loss 3.126, len train loss 0.033, col train loss 132.662


Epoch 872: 1batch [00:00,  9.62batch/s, loss=1.42e+3]

epoch 871: avg test  loss 1496.03, bar  test loss 3.444, len  test loss 0.037, col  test loss 134.031


Epoch 872: 272batch [00:33,  8.24batch/s, loss=1.32e+3]


epoch 872: avg train loss 1478.18, bar train loss 2.983, len train loss 0.032, col train loss 132.733


Epoch 873: 1batch [00:00,  9.01batch/s, loss=1.51e+3]

epoch 872: avg test  loss 1493.85, bar  test loss 2.954, len  test loss 0.036, col  test loss 134.842


Epoch 873: 272batch [00:33,  8.12batch/s, loss=1.5e+3] 


epoch 873: avg train loss 1479.13, bar train loss 3.019, len train loss 0.032, col train loss 132.871


Epoch 874: 1batch [00:00,  8.62batch/s, loss=1.52e+3]

epoch 873: avg test  loss 1499.58, bar  test loss 3.271, len  test loss 0.035, col  test loss 134.905


Epoch 874: 272batch [00:33,  8.19batch/s, loss=1.57e+3]


epoch 874: avg train loss 1475.08, bar train loss 2.918, len train loss 0.032, col train loss 132.553


Epoch 875: 1batch [00:00,  9.01batch/s, loss=1.54e+3]

epoch 874: avg test  loss 1497.35, bar  test loss 3.140, len  test loss 0.033, col  test loss 134.726


Epoch 875: 272batch [00:32,  8.24batch/s, loss=1.65e+3]


epoch 875: avg train loss 1476.73, bar train loss 2.927, len train loss 0.032, col train loss 132.409
epoch 875: avg test  loss 1494.38, bar  test loss 3.091, len  test loss 0.035, col  test loss 133.847


Epoch 876: 272batch [00:33,  8.08batch/s, loss=1.49e+3]


epoch 876: avg train loss 1478.00, bar train loss 2.953, len train loss 0.033, col train loss 132.580


Epoch 877: 1batch [00:00,  9.26batch/s, loss=1.44e+3]

epoch 876: avg test  loss 1494.10, bar  test loss 3.002, len  test loss 0.037, col  test loss 134.070


Epoch 877: 272batch [00:32,  8.25batch/s, loss=1.46e+3]


epoch 877: avg train loss 1479.79, bar train loss 2.991, len train loss 0.033, col train loss 133.046


Epoch 878: 1batch [00:00,  9.01batch/s, loss=1.46e+3]

epoch 877: avg test  loss 1504.53, bar  test loss 4.051, len  test loss 0.034, col  test loss 134.153


Epoch 878: 272batch [00:33,  8.18batch/s, loss=1.48e+3]


epoch 878: avg train loss 1478.72, bar train loss 3.046, len train loss 0.033, col train loss 132.808


Epoch 879: 1batch [00:00,  8.55batch/s, loss=1.39e+3]

epoch 878: avg test  loss 1500.04, bar  test loss 3.048, len  test loss 0.036, col  test loss 134.216


Epoch 879: 272batch [00:33,  8.20batch/s, loss=1.46e+3]


epoch 879: avg train loss 1479.97, bar train loss 3.029, len train loss 0.034, col train loss 132.939


Epoch 880: 1batch [00:00,  8.62batch/s, loss=1.39e+3]

epoch 879: avg test  loss 1499.16, bar  test loss 2.989, len  test loss 0.035, col  test loss 134.782


Epoch 880: 272batch [00:32,  8.26batch/s, loss=1.4e+3] 


epoch 880: avg train loss 1480.23, bar train loss 2.986, len train loss 0.033, col train loss 132.860
epoch 880: avg test  loss 1504.14, bar  test loss 3.306, len  test loss 0.046, col  test loss 135.643


Epoch 881: 272batch [00:33,  8.22batch/s, loss=1.28e+3]


epoch 881: avg train loss 1480.40, bar train loss 3.034, len train loss 0.032, col train loss 133.177


Epoch 882: 1batch [00:00,  8.47batch/s, loss=1.53e+3]

epoch 881: avg test  loss 1503.30, bar  test loss 3.459, len  test loss 0.035, col  test loss 134.808


Epoch 882: 272batch [00:33,  8.12batch/s, loss=1.54e+3]


epoch 882: avg train loss 1478.32, bar train loss 2.967, len train loss 0.034, col train loss 132.794


Epoch 883: 1batch [00:00,  9.09batch/s, loss=1.56e+3]

epoch 882: avg test  loss 1496.86, bar  test loss 3.009, len  test loss 0.034, col  test loss 134.910


Epoch 883: 272batch [00:33,  8.18batch/s, loss=1.37e+3]


epoch 883: avg train loss 1477.98, bar train loss 2.923, len train loss 0.032, col train loss 132.543


Epoch 884: 1batch [00:00,  9.43batch/s, loss=1.44e+3]

epoch 883: avg test  loss 1507.22, bar  test loss 3.555, len  test loss 0.036, col  test loss 134.393


Epoch 884: 272batch [00:33,  8.14batch/s, loss=1.65e+3]


epoch 884: avg train loss 1482.40, bar train loss 3.055, len train loss 0.033, col train loss 133.099


Epoch 885: 1batch [00:00,  9.17batch/s, loss=1.47e+3]

epoch 884: avg test  loss 1504.06, bar  test loss 3.377, len  test loss 0.034, col  test loss 135.300


Epoch 885: 272batch [00:33,  8.17batch/s, loss=1.52e+3]


epoch 885: avg train loss 1481.69, bar train loss 2.987, len train loss 0.033, col train loss 132.868
epoch 885: avg test  loss 1497.21, bar  test loss 3.092, len  test loss 0.035, col  test loss 134.484


Epoch 886: 272batch [00:33,  8.14batch/s, loss=1.39e+3]


epoch 886: avg train loss 1480.00, bar train loss 3.018, len train loss 0.034, col train loss 132.955


Epoch 887: 1batch [00:00,  8.70batch/s, loss=1.57e+3]

epoch 886: avg test  loss 1505.83, bar  test loss 3.649, len  test loss 0.036, col  test loss 135.108


Epoch 887: 272batch [00:33,  8.16batch/s, loss=1.44e+3]


epoch 887: avg train loss 1480.41, bar train loss 2.924, len train loss 0.032, col train loss 133.266


Epoch 888: 1batch [00:00,  7.52batch/s, loss=1.46e+3]

epoch 887: avg test  loss 1495.19, bar  test loss 3.022, len  test loss 0.040, col  test loss 134.574


Epoch 888: 272batch [00:33,  8.14batch/s, loss=1.41e+3]


epoch 888: avg train loss 1481.45, bar train loss 3.046, len train loss 0.031, col train loss 132.878


Epoch 889: 1batch [00:00,  8.33batch/s, loss=1.48e+3]

epoch 888: avg test  loss 1502.84, bar  test loss 3.161, len  test loss 0.035, col  test loss 135.413


Epoch 889: 272batch [00:33,  8.10batch/s, loss=1.48e+3]


epoch 889: avg train loss 1482.82, bar train loss 3.018, len train loss 0.033, col train loss 133.125


Epoch 890: 1batch [00:00,  9.01batch/s, loss=1.5e+3]

epoch 889: avg test  loss 1497.56, bar  test loss 3.303, len  test loss 0.034, col  test loss 135.055


Epoch 890: 272batch [00:33,  8.09batch/s, loss=1.62e+3]


epoch 890: avg train loss 1481.82, bar train loss 2.998, len train loss 0.033, col train loss 133.114
epoch 890: avg test  loss 1519.91, bar  test loss 4.092, len  test loss 0.036, col  test loss 135.465


Epoch 891: 272batch [00:33,  8.05batch/s, loss=1.45e+3]


epoch 891: avg train loss 1485.70, bar train loss 3.099, len train loss 0.033, col train loss 133.369


Epoch 892: 1batch [00:00,  8.62batch/s, loss=1.45e+3]

epoch 891: avg test  loss 1501.47, bar  test loss 3.139, len  test loss 0.037, col  test loss 135.084


Epoch 892: 272batch [00:33,  8.12batch/s, loss=1.52e+3]


epoch 892: avg train loss 1481.43, bar train loss 3.039, len train loss 0.033, col train loss 132.842


Epoch 893: 1batch [00:00,  7.09batch/s, loss=1.46e+3]

epoch 892: avg test  loss 1501.32, bar  test loss 3.374, len  test loss 0.035, col  test loss 134.871


Epoch 893: 272batch [00:33,  8.00batch/s, loss=1.44e+3]


epoch 893: avg train loss 1479.30, bar train loss 3.066, len train loss 0.033, col train loss 132.874


Epoch 894: 1batch [00:00,  8.85batch/s, loss=1.52e+3]

epoch 893: avg test  loss 1501.85, bar  test loss 3.397, len  test loss 0.036, col  test loss 134.661


Epoch 894: 272batch [00:34,  7.97batch/s, loss=1.43e+3]


epoch 894: avg train loss 1480.71, bar train loss 2.971, len train loss 0.034, col train loss 133.077


Epoch 895: 1batch [00:00,  8.85batch/s, loss=1.5e+3]

epoch 894: avg test  loss 1498.08, bar  test loss 3.080, len  test loss 0.036, col  test loss 135.820


Epoch 895: 272batch [00:33,  8.14batch/s, loss=1.54e+3]


epoch 895: avg train loss 1481.61, bar train loss 2.990, len train loss 0.033, col train loss 133.110
epoch 895: avg test  loss 1505.65, bar  test loss 3.646, len  test loss 0.035, col  test loss 134.549


Epoch 896: 272batch [00:33,  8.06batch/s, loss=1.5e+3] 


epoch 896: avg train loss 1481.52, bar train loss 2.964, len train loss 0.033, col train loss 133.031


Epoch 897: 1batch [00:00,  7.81batch/s, loss=1.48e+3]

epoch 896: avg test  loss 1508.95, bar  test loss 4.039, len  test loss 0.036, col  test loss 134.558


Epoch 897: 272batch [00:33,  8.11batch/s, loss=1.54e+3]


epoch 897: avg train loss 1482.95, bar train loss 3.040, len train loss 0.034, col train loss 133.214


Epoch 898: 1batch [00:00,  8.93batch/s, loss=1.46e+3]

epoch 897: avg test  loss 1511.75, bar  test loss 3.028, len  test loss 0.037, col  test loss 134.874


Epoch 898: 272batch [00:33,  8.08batch/s, loss=1.47e+3]


epoch 898: avg train loss 1484.80, bar train loss 3.037, len train loss 0.032, col train loss 133.330


Epoch 899: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 898: avg test  loss 1501.49, bar  test loss 3.136, len  test loss 0.034, col  test loss 134.959


Epoch 899: 272batch [00:33,  8.10batch/s, loss=1.43e+3]


epoch 899: avg train loss 1481.09, bar train loss 2.982, len train loss 0.033, col train loss 133.126


Epoch 900: 1batch [00:00,  9.43batch/s, loss=1.47e+3]

epoch 899: avg test  loss 1504.69, bar  test loss 3.178, len  test loss 0.034, col  test loss 134.631


Epoch 900: 272batch [00:33,  8.07batch/s, loss=1.53e+3]


epoch 900: avg train loss 1483.34, bar train loss 2.984, len train loss 0.032, col train loss 133.141
epoch 900: avg test  loss 1499.91, bar  test loss 3.181, len  test loss 0.037, col  test loss 134.842


Epoch 901: 272batch [00:33,  8.04batch/s, loss=1.38e+3]


epoch 901: avg train loss 1482.81, bar train loss 2.987, len train loss 0.032, col train loss 133.266


Epoch 902: 1batch [00:00,  9.09batch/s, loss=1.45e+3]

epoch 901: avg test  loss 1508.64, bar  test loss 3.462, len  test loss 0.038, col  test loss 134.113


Epoch 902: 272batch [00:33,  8.02batch/s, loss=1.42e+3]


epoch 902: avg train loss 1484.14, bar train loss 3.166, len train loss 0.033, col train loss 133.141


Epoch 903: 1batch [00:00,  8.93batch/s, loss=1.45e+3]

epoch 902: avg test  loss 1500.02, bar  test loss 3.078, len  test loss 0.039, col  test loss 135.255


Epoch 903: 272batch [00:33,  8.02batch/s, loss=1.59e+3]


epoch 903: avg train loss 1485.30, bar train loss 3.046, len train loss 0.032, col train loss 133.459


Epoch 904: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 903: avg test  loss 1519.93, bar  test loss 5.187, len  test loss 0.036, col  test loss 135.172


Epoch 904: 272batch [00:33,  8.08batch/s, loss=1.4e+3] 


epoch 904: avg train loss 1486.05, bar train loss 3.030, len train loss 0.033, col train loss 133.541


Epoch 905: 1batch [00:00,  9.43batch/s, loss=1.48e+3]

epoch 904: avg test  loss 1503.20, bar  test loss 3.352, len  test loss 0.036, col  test loss 134.596


Epoch 905: 272batch [00:33,  8.06batch/s, loss=1.5e+3] 


epoch 905: avg train loss 1483.80, bar train loss 3.069, len train loss 0.033, col train loss 133.235
epoch 905: avg test  loss 1499.12, bar  test loss 3.274, len  test loss 0.034, col  test loss 134.967


Epoch 906: 272batch [00:33,  8.07batch/s, loss=1.49e+3]


epoch 906: avg train loss 1485.68, bar train loss 3.118, len train loss 0.032, col train loss 133.516


Epoch 907: 1batch [00:00,  8.55batch/s, loss=1.42e+3]

epoch 906: avg test  loss 1509.27, bar  test loss 3.651, len  test loss 0.034, col  test loss 135.356


Epoch 907: 272batch [00:33,  8.03batch/s, loss=1.48e+3]


epoch 907: avg train loss 1485.66, bar train loss 3.063, len train loss 0.032, col train loss 133.540


Epoch 908: 1batch [00:00,  9.43batch/s, loss=1.49e+3]

epoch 907: avg test  loss 1504.47, bar  test loss 3.306, len  test loss 0.033, col  test loss 135.380


Epoch 908: 272batch [00:34,  8.00batch/s, loss=1.4e+3] 


epoch 908: avg train loss 1483.59, bar train loss 3.137, len train loss 0.033, col train loss 133.205


Epoch 909: 1batch [00:00,  8.26batch/s, loss=1.49e+3]

epoch 908: avg test  loss 1501.35, bar  test loss 3.022, len  test loss 0.038, col  test loss 135.559


Epoch 909: 272batch [00:33,  8.02batch/s, loss=1.53e+3]


epoch 909: avg train loss 1484.94, bar train loss 3.003, len train loss 0.034, col train loss 133.507


Epoch 910: 1batch [00:00,  8.47batch/s, loss=1.5e+3]

epoch 909: avg test  loss 1500.51, bar  test loss 3.135, len  test loss 0.034, col  test loss 135.476


Epoch 910: 272batch [00:33,  8.09batch/s, loss=1.52e+3]


epoch 910: avg train loss 1485.17, bar train loss 3.070, len train loss 0.034, col train loss 133.405
epoch 910: avg test  loss 1501.65, bar  test loss 3.453, len  test loss 0.036, col  test loss 135.039


Epoch 911: 272batch [00:34,  7.95batch/s, loss=1.66e+3]


epoch 911: avg train loss 1483.41, bar train loss 2.992, len train loss 0.033, col train loss 133.267


Epoch 912: 1batch [00:00,  8.20batch/s, loss=1.49e+3]

epoch 911: avg test  loss 1501.37, bar  test loss 3.254, len  test loss 0.035, col  test loss 135.421


Epoch 912: 272batch [00:34,  7.96batch/s, loss=1.43e+3]


epoch 912: avg train loss 1489.05, bar train loss 3.211, len train loss 0.035, col train loss 133.667


Epoch 913: 1batch [00:00,  8.62batch/s, loss=1.5e+3]

epoch 912: avg test  loss 1506.96, bar  test loss 3.243, len  test loss 0.039, col  test loss 134.978


Epoch 913: 272batch [00:34,  7.98batch/s, loss=1.49e+3]


epoch 913: avg train loss 1489.30, bar train loss 3.100, len train loss 0.034, col train loss 133.879


Epoch 914: 1batch [00:00,  8.70batch/s, loss=1.48e+3]

epoch 913: avg test  loss 1524.17, bar  test loss 4.242, len  test loss 0.044, col  test loss 136.292


Epoch 914: 272batch [00:33,  8.02batch/s, loss=1.58e+3]


epoch 914: avg train loss 1489.13, bar train loss 3.091, len train loss 0.033, col train loss 133.554


Epoch 915: 1batch [00:00,  7.87batch/s, loss=1.47e+3]

epoch 914: avg test  loss 1505.53, bar  test loss 3.191, len  test loss 0.034, col  test loss 135.727


Epoch 915: 272batch [00:34,  7.88batch/s, loss=1.54e+3]


epoch 915: avg train loss 1487.03, bar train loss 3.117, len train loss 0.033, col train loss 133.759
epoch 915: avg test  loss 1501.08, bar  test loss 3.250, len  test loss 0.037, col  test loss 134.661


Epoch 916: 272batch [00:34,  7.90batch/s, loss=1.45e+3]


epoch 916: avg train loss 1488.08, bar train loss 2.993, len train loss 0.033, col train loss 133.787


Epoch 917: 1batch [00:00,  7.94batch/s, loss=1.47e+3]

epoch 916: avg test  loss 1507.60, bar  test loss 3.234, len  test loss 0.038, col  test loss 135.231


Epoch 917: 272batch [00:34,  7.89batch/s, loss=1.39e+3]


epoch 917: avg train loss 1489.32, bar train loss 3.085, len train loss 0.033, col train loss 133.988


Epoch 918: 1batch [00:00,  8.77batch/s, loss=1.46e+3]

epoch 917: avg test  loss 1517.73, bar  test loss 4.521, len  test loss 0.035, col  test loss 135.733


Epoch 918: 272batch [00:34,  7.96batch/s, loss=1.56e+3]


epoch 918: avg train loss 1485.03, bar train loss 3.123, len train loss 0.033, col train loss 133.541


Epoch 919: 1batch [00:00,  9.17batch/s, loss=1.52e+3]

epoch 918: avg test  loss 1507.08, bar  test loss 3.367, len  test loss 0.038, col  test loss 135.665


Epoch 919: 272batch [00:33,  8.01batch/s, loss=1.53e+3]


epoch 919: avg train loss 1490.69, bar train loss 3.094, len train loss 0.035, col train loss 133.871


Epoch 920: 1batch [00:00,  9.01batch/s, loss=1.54e+3]

epoch 919: avg test  loss 1580.85, bar  test loss 9.348, len  test loss 0.043, col  test loss 136.797


Epoch 920: 272batch [00:34,  7.97batch/s, loss=1.46e+3]


epoch 920: avg train loss 1487.45, bar train loss 3.144, len train loss 0.033, col train loss 133.712
epoch 920: avg test  loss 1511.95, bar  test loss 3.522, len  test loss 0.035, col  test loss 135.634


Epoch 921: 272batch [00:34,  7.91batch/s, loss=1.49e+3]


epoch 921: avg train loss 1488.20, bar train loss 3.041, len train loss 0.033, col train loss 133.837


Epoch 922: 1batch [00:00,  8.77batch/s, loss=1.56e+3]

epoch 921: avg test  loss 1511.01, bar  test loss 3.741, len  test loss 0.035, col  test loss 135.598


Epoch 922: 272batch [00:34,  7.95batch/s, loss=1.51e+3]


epoch 922: avg train loss 1489.60, bar train loss 3.092, len train loss 0.033, col train loss 133.946


Epoch 923: 1batch [00:00,  8.70batch/s, loss=1.44e+3]

epoch 922: avg test  loss 1507.42, bar  test loss 3.189, len  test loss 0.036, col  test loss 135.864


Epoch 923: 272batch [00:34,  7.94batch/s, loss=1.52e+3]


epoch 923: avg train loss 1492.28, bar train loss 3.082, len train loss 0.033, col train loss 134.261


Epoch 924: 1batch [00:00,  8.77batch/s, loss=1.52e+3]

epoch 923: avg test  loss 1515.56, bar  test loss 3.135, len  test loss 0.041, col  test loss 136.391


Epoch 924: 272batch [00:34,  7.95batch/s, loss=1.47e+3]


epoch 924: avg train loss 1490.97, bar train loss 3.058, len train loss 0.033, col train loss 134.093


Epoch 925: 1batch [00:00,  8.20batch/s, loss=1.51e+3]

epoch 924: avg test  loss 1504.34, bar  test loss 3.182, len  test loss 0.034, col  test loss 135.240


Epoch 925: 272batch [00:34,  7.91batch/s, loss=1.48e+3]


epoch 925: avg train loss 1491.55, bar train loss 3.090, len train loss 0.032, col train loss 134.241
epoch 925: avg test  loss 1516.89, bar  test loss 3.548, len  test loss 0.036, col  test loss 136.405


Epoch 926: 272batch [00:34,  7.96batch/s, loss=1.43e+3]


epoch 926: avg train loss 1487.89, bar train loss 3.098, len train loss 0.032, col train loss 133.584


Epoch 927: 1batch [00:00,  8.40batch/s, loss=1.48e+3]

epoch 926: avg test  loss 1512.76, bar  test loss 3.403, len  test loss 0.036, col  test loss 135.983


Epoch 927: 272batch [00:34,  7.92batch/s, loss=1.63e+3]


epoch 927: avg train loss 1490.68, bar train loss 3.024, len train loss 0.032, col train loss 133.978


Epoch 928: 1batch [00:00,  8.20batch/s, loss=1.51e+3]

epoch 927: avg test  loss 1510.34, bar  test loss 3.588, len  test loss 0.034, col  test loss 135.539


Epoch 928: 272batch [00:34,  7.88batch/s, loss=1.61e+3]


epoch 928: avg train loss 1491.85, bar train loss 3.254, len train loss 0.033, col train loss 133.851


Epoch 929: 1batch [00:00,  8.85batch/s, loss=1.58e+3]

epoch 928: avg test  loss 1504.25, bar  test loss 3.135, len  test loss 0.034, col  test loss 134.934


Epoch 929: 272batch [00:34,  7.91batch/s, loss=1.45e+3]


epoch 929: avg train loss 1488.18, bar train loss 3.021, len train loss 0.033, col train loss 133.788


Epoch 930: 1batch [00:00,  9.43batch/s, loss=1.45e+3]

epoch 929: avg test  loss 1504.71, bar  test loss 3.057, len  test loss 0.035, col  test loss 136.067


Epoch 930: 272batch [00:34,  7.92batch/s, loss=1.42e+3]


epoch 930: avg train loss 1492.08, bar train loss 3.093, len train loss 0.034, col train loss 134.297
epoch 930: avg test  loss 1507.42, bar  test loss 3.191, len  test loss 0.041, col  test loss 135.117


Epoch 931: 272batch [00:34,  7.92batch/s, loss=1.53e+3]


epoch 931: avg train loss 1493.49, bar train loss 3.152, len train loss 0.034, col train loss 134.277


Epoch 932: 1batch [00:00,  9.01batch/s, loss=1.56e+3]

epoch 931: avg test  loss 1542.47, bar  test loss 6.674, len  test loss 0.035, col  test loss 136.182


Epoch 932: 272batch [00:34,  7.88batch/s, loss=1.57e+3]


epoch 932: avg train loss 1489.39, bar train loss 3.110, len train loss 0.031, col train loss 133.855


Epoch 933: 1batch [00:00,  8.47batch/s, loss=1.54e+3]

epoch 932: avg test  loss 1512.65, bar  test loss 3.745, len  test loss 0.035, col  test loss 135.180


Epoch 933: 272batch [00:34,  7.85batch/s, loss=1.56e+3]


epoch 933: avg train loss 1490.53, bar train loss 3.049, len train loss 0.033, col train loss 134.070


Epoch 934: 1batch [00:00,  9.01batch/s, loss=1.47e+3]

epoch 933: avg test  loss 1507.77, bar  test loss 3.106, len  test loss 0.039, col  test loss 135.962


Epoch 934: 272batch [00:34,  7.86batch/s, loss=1.54e+3]


epoch 934: avg train loss 1492.99, bar train loss 3.280, len train loss 0.033, col train loss 134.040


Epoch 935: 1batch [00:00,  8.85batch/s, loss=1.5e+3]

epoch 934: avg test  loss 1504.09, bar  test loss 3.110, len  test loss 0.034, col  test loss 134.852


Epoch 935: 272batch [00:34,  7.86batch/s, loss=1.48e+3]


epoch 935: avg train loss 1490.65, bar train loss 3.006, len train loss 0.034, col train loss 134.152
epoch 935: avg test  loss 1512.30, bar  test loss 3.807, len  test loss 0.034, col  test loss 135.646


Epoch 936: 272batch [00:34,  7.83batch/s, loss=1.41e+3]


epoch 936: avg train loss 1493.90, bar train loss 3.158, len train loss 0.034, col train loss 134.311


Epoch 937: 1batch [00:00,  9.71batch/s, loss=1.46e+3]

epoch 936: avg test  loss 1518.77, bar  test loss 4.187, len  test loss 0.035, col  test loss 135.599


Epoch 937: 272batch [00:34,  7.77batch/s, loss=1.39e+3]


epoch 937: avg train loss 1491.02, bar train loss 3.122, len train loss 0.032, col train loss 133.940


Epoch 938: 1batch [00:00,  8.62batch/s, loss=1.48e+3]

epoch 937: avg test  loss 1507.75, bar  test loss 3.129, len  test loss 0.035, col  test loss 135.082


Epoch 938: 272batch [00:35,  7.66batch/s, loss=1.46e+3]


epoch 938: avg train loss 1491.08, bar train loss 3.000, len train loss 0.034, col train loss 134.074


Epoch 939: 1batch [00:00,  9.26batch/s, loss=1.47e+3]

epoch 938: avg test  loss 1503.44, bar  test loss 3.267, len  test loss 0.035, col  test loss 135.302


Epoch 939: 272batch [00:35,  7.65batch/s, loss=1.51e+3]


epoch 939: avg train loss 1487.53, bar train loss 3.033, len train loss 0.033, col train loss 133.903


Epoch 940: 1batch [00:00,  8.85batch/s, loss=1.47e+3]

epoch 939: avg test  loss 1507.76, bar  test loss 3.353, len  test loss 0.035, col  test loss 135.389


Epoch 940: 272batch [00:35,  7.60batch/s, loss=1.45e+3]


epoch 940: avg train loss 1490.81, bar train loss 3.152, len train loss 0.033, col train loss 133.961
epoch 940: avg test  loss 1543.72, bar  test loss 6.502, len  test loss 0.038, col  test loss 136.870


Epoch 941: 272batch [00:34,  7.83batch/s, loss=1.55e+3]


epoch 941: avg train loss 1492.10, bar train loss 3.227, len train loss 0.034, col train loss 134.237


Epoch 942: 1batch [00:00,  8.47batch/s, loss=1.46e+3]

epoch 941: avg test  loss 1505.92, bar  test loss 3.272, len  test loss 0.035, col  test loss 134.927


Epoch 942: 272batch [00:34,  7.83batch/s, loss=1.56e+3]


epoch 942: avg train loss 1490.84, bar train loss 3.050, len train loss 0.033, col train loss 134.157


Epoch 943: 1batch [00:00,  8.70batch/s, loss=1.48e+3]

epoch 942: avg test  loss 1513.89, bar  test loss 3.254, len  test loss 0.036, col  test loss 136.901


Epoch 943: 272batch [00:34,  7.81batch/s, loss=1.52e+3]


epoch 943: avg train loss 1494.55, bar train loss 3.098, len train loss 0.031, col train loss 134.459


Epoch 944: 1batch [00:00,  9.09batch/s, loss=1.52e+3]

epoch 943: avg test  loss 1515.95, bar  test loss 3.301, len  test loss 0.033, col  test loss 136.113


Epoch 944: 272batch [00:34,  7.77batch/s, loss=1.43e+3]


epoch 944: avg train loss 1496.66, bar train loss 3.198, len train loss 0.033, col train loss 134.412


Epoch 945: 1batch [00:00,  8.26batch/s, loss=1.52e+3]

epoch 944: avg test  loss 1514.55, bar  test loss 3.505, len  test loss 0.035, col  test loss 135.568


Epoch 945: 272batch [00:35,  7.75batch/s, loss=1.56e+3]


epoch 945: avg train loss 1490.99, bar train loss 3.074, len train loss 0.033, col train loss 134.095
epoch 945: avg test  loss 1513.28, bar  test loss 3.539, len  test loss 0.036, col  test loss 135.756


Epoch 946: 272batch [00:35,  7.75batch/s, loss=1.59e+3]


epoch 946: avg train loss 1493.60, bar train loss 3.185, len train loss 0.034, col train loss 134.284


Epoch 947: 1batch [00:00,  7.63batch/s, loss=1.52e+3]

epoch 946: avg test  loss 1514.61, bar  test loss 3.161, len  test loss 0.036, col  test loss 135.613


Epoch 947: 272batch [00:34,  7.79batch/s, loss=1.59e+3]


epoch 947: avg train loss 1493.46, bar train loss 3.154, len train loss 0.034, col train loss 134.286


Epoch 948: 1batch [00:00,  8.62batch/s, loss=1.54e+3]

epoch 947: avg test  loss 1511.77, bar  test loss 3.154, len  test loss 0.041, col  test loss 135.452


Epoch 948: 272batch [00:34,  7.80batch/s, loss=1.58e+3]


epoch 948: avg train loss 1494.85, bar train loss 3.139, len train loss 0.034, col train loss 134.379


Epoch 949: 1batch [00:00,  8.77batch/s, loss=1.48e+3]

epoch 948: avg test  loss 1518.46, bar  test loss 3.918, len  test loss 0.036, col  test loss 136.190


Epoch 949: 272batch [00:34,  7.79batch/s, loss=1.5e+3] 


epoch 949: avg train loss 1494.15, bar train loss 3.155, len train loss 0.033, col train loss 134.401


Epoch 950: 1batch [00:00,  8.70batch/s, loss=1.53e+3]

epoch 949: avg test  loss 1510.69, bar  test loss 3.576, len  test loss 0.035, col  test loss 135.861


Epoch 950: 272batch [00:35,  7.75batch/s, loss=1.41e+3]


epoch 950: avg train loss 1492.15, bar train loss 3.023, len train loss 0.032, col train loss 134.313
epoch 950: avg test  loss 1517.93, bar  test loss 3.304, len  test loss 0.043, col  test loss 135.870


Epoch 951: 272batch [00:34,  7.78batch/s, loss=1.45e+3]


epoch 951: avg train loss 1494.22, bar train loss 3.101, len train loss 0.033, col train loss 134.349


Epoch 952: 1batch [00:00,  8.62batch/s, loss=1.56e+3]

epoch 951: avg test  loss 1516.32, bar  test loss 3.692, len  test loss 0.035, col  test loss 136.214


Epoch 952: 272batch [00:35,  7.75batch/s, loss=1.51e+3]


epoch 952: avg train loss 1492.98, bar train loss 3.083, len train loss 0.033, col train loss 134.254


Epoch 953: 1batch [00:00,  8.77batch/s, loss=1.54e+3]

epoch 952: avg test  loss 1513.40, bar  test loss 3.617, len  test loss 0.035, col  test loss 136.019


Epoch 953: 272batch [00:35,  7.72batch/s, loss=1.51e+3]


epoch 953: avg train loss 1493.02, bar train loss 3.186, len train loss 0.033, col train loss 134.135


Epoch 954: 1batch [00:00,  8.55batch/s, loss=1.49e+3]

epoch 953: avg test  loss 1509.98, bar  test loss 3.096, len  test loss 0.036, col  test loss 135.772


Epoch 954: 272batch [00:35,  7.74batch/s, loss=1.5e+3] 


epoch 954: avg train loss 1494.86, bar train loss 3.119, len train loss 0.033, col train loss 134.606


Epoch 955: 1batch [00:00,  7.87batch/s, loss=1.48e+3]

epoch 954: avg test  loss 1519.03, bar  test loss 4.009, len  test loss 0.034, col  test loss 135.960


Epoch 955: 272batch [00:35,  7.73batch/s, loss=1.56e+3]


epoch 955: avg train loss 1497.25, bar train loss 3.165, len train loss 0.034, col train loss 134.604
epoch 955: avg test  loss 1511.78, bar  test loss 3.380, len  test loss 0.035, col  test loss 135.785


Epoch 956: 272batch [00:35,  7.76batch/s, loss=1.51e+3]


epoch 956: avg train loss 1496.44, bar train loss 3.101, len train loss 0.033, col train loss 134.588


Epoch 957: 1batch [00:00,  8.47batch/s, loss=1.51e+3]

epoch 956: avg test  loss 1515.71, bar  test loss 3.207, len  test loss 0.042, col  test loss 136.511


Epoch 957: 272batch [00:35,  7.70batch/s, loss=1.55e+3]


epoch 957: avg train loss 1497.96, bar train loss 3.043, len train loss 0.033, col train loss 134.763


Epoch 958: 1batch [00:00,  8.62batch/s, loss=1.45e+3]

epoch 957: avg test  loss 1511.75, bar  test loss 3.186, len  test loss 0.036, col  test loss 136.257


Epoch 958: 272batch [00:35,  7.69batch/s, loss=1.4e+3] 


epoch 958: avg train loss 1497.83, bar train loss 3.207, len train loss 0.035, col train loss 134.789


Epoch 959: 1batch [00:00,  9.01batch/s, loss=1.5e+3]

epoch 958: avg test  loss 1514.88, bar  test loss 3.137, len  test loss 0.037, col  test loss 136.667


Epoch 959: 272batch [00:35,  7.69batch/s, loss=1.43e+3]


epoch 959: avg train loss 1495.19, bar train loss 3.135, len train loss 0.033, col train loss 134.582


Epoch 960: 1batch [00:00,  8.47batch/s, loss=1.53e+3]

epoch 959: avg test  loss 1518.05, bar  test loss 3.423, len  test loss 0.035, col  test loss 136.644


Epoch 960: 272batch [00:35,  7.68batch/s, loss=1.52e+3]


epoch 960: avg train loss 1492.11, bar train loss 3.044, len train loss 0.031, col train loss 134.152
epoch 960: avg test  loss 1512.49, bar  test loss 3.349, len  test loss 0.035, col  test loss 135.865


Epoch 961: 272batch [00:35,  7.75batch/s, loss=1.42e+3]


epoch 961: avg train loss 1494.70, bar train loss 3.177, len train loss 0.033, col train loss 134.432


Epoch 962: 1batch [00:00,  8.85batch/s, loss=1.47e+3]

epoch 961: avg test  loss 1510.37, bar  test loss 3.195, len  test loss 0.036, col  test loss 136.483


Epoch 962: 272batch [00:35,  7.58batch/s, loss=1.58e+3]


epoch 962: avg train loss 1495.35, bar train loss 3.053, len train loss 0.033, col train loss 134.878


Epoch 963: 1batch [00:00,  8.62batch/s, loss=1.5e+3]

epoch 962: avg test  loss 1520.86, bar  test loss 3.995, len  test loss 0.039, col  test loss 136.477


Epoch 963: 272batch [00:35,  7.64batch/s, loss=1.57e+3]


epoch 963: avg train loss 1499.61, bar train loss 3.168, len train loss 0.033, col train loss 135.014


Epoch 964: 1batch [00:00,  8.62batch/s, loss=1.47e+3]

epoch 963: avg test  loss 1519.55, bar  test loss 3.342, len  test loss 0.038, col  test loss 137.038


Epoch 964: 272batch [00:35,  7.68batch/s, loss=1.36e+3]


epoch 964: avg train loss 1497.47, bar train loss 3.212, len train loss 0.032, col train loss 134.454


Epoch 965: 1batch [00:00,  8.77batch/s, loss=1.4e+3]

epoch 964: avg test  loss 1525.98, bar  test loss 4.968, len  test loss 0.035, col  test loss 136.161


Epoch 965: 272batch [00:35,  7.68batch/s, loss=1.47e+3]


epoch 965: avg train loss 1495.95, bar train loss 3.138, len train loss 0.032, col train loss 134.659
epoch 965: avg test  loss 1512.92, bar  test loss 3.303, len  test loss 0.038, col  test loss 136.163


Epoch 966: 272batch [00:35,  7.65batch/s, loss=1.47e+3]


epoch 966: avg train loss 1493.40, bar train loss 3.152, len train loss 0.034, col train loss 134.231


Epoch 967: 1batch [00:00,  9.35batch/s, loss=1.54e+3]

epoch 966: avg test  loss 1510.17, bar  test loss 3.351, len  test loss 0.034, col  test loss 135.603


Epoch 967: 272batch [00:35,  7.66batch/s, loss=1.43e+3]


epoch 967: avg train loss 1495.38, bar train loss 3.158, len train loss 0.033, col train loss 134.669


Epoch 968: 1batch [00:00,  7.63batch/s, loss=1.4e+3]

epoch 967: avg test  loss 1514.70, bar  test loss 3.164, len  test loss 0.038, col  test loss 136.353


Epoch 968: 272batch [00:35,  7.71batch/s, loss=1.41e+3]


epoch 968: avg train loss 1498.32, bar train loss 3.136, len train loss 0.032, col train loss 134.752


Epoch 969: 1batch [00:00,  8.77batch/s, loss=1.49e+3]

epoch 968: avg test  loss 1521.43, bar  test loss 3.582, len  test loss 0.035, col  test loss 136.407


Epoch 969: 272batch [00:35,  7.69batch/s, loss=1.56e+3]


epoch 969: avg train loss 1499.75, bar train loss 3.194, len train loss 0.033, col train loss 135.071


Epoch 970: 1batch [00:00,  8.33batch/s, loss=1.57e+3]

epoch 969: avg test  loss 1514.98, bar  test loss 3.411, len  test loss 0.033, col  test loss 136.611


Epoch 970: 272batch [00:35,  7.66batch/s, loss=1.49e+3]


epoch 970: avg train loss 1498.94, bar train loss 3.151, len train loss 0.034, col train loss 134.931
epoch 970: avg test  loss 1512.21, bar  test loss 3.194, len  test loss 0.033, col  test loss 136.096


Epoch 971: 272batch [00:35,  7.62batch/s, loss=1.48e+3]


epoch 971: avg train loss 1500.89, bar train loss 3.196, len train loss 0.032, col train loss 134.928


Epoch 972: 1batch [00:00,  9.01batch/s, loss=1.47e+3]

epoch 971: avg test  loss 1517.53, bar  test loss 3.547, len  test loss 0.034, col  test loss 136.422


Epoch 972: 272batch [00:35,  7.66batch/s, loss=1.57e+3]


epoch 972: avg train loss 1502.71, bar train loss 3.192, len train loss 0.034, col train loss 135.217


Epoch 973: 1batch [00:00,  8.20batch/s, loss=1.41e+3]

epoch 972: avg test  loss 1519.07, bar  test loss 3.448, len  test loss 0.037, col  test loss 137.228


Epoch 973: 272batch [00:36,  7.50batch/s, loss=1.43e+3]


epoch 973: avg train loss 1495.55, bar train loss 3.105, len train loss 0.033, col train loss 134.698


Epoch 974: 1batch [00:00,  8.55batch/s, loss=1.51e+3]

epoch 973: avg test  loss 1513.92, bar  test loss 3.701, len  test loss 0.036, col  test loss 136.009


Epoch 974: 272batch [00:35,  7.64batch/s, loss=1.51e+3]


epoch 974: avg train loss 1496.25, bar train loss 3.173, len train loss 0.033, col train loss 134.614


Epoch 975: 1batch [00:00,  8.55batch/s, loss=1.47e+3]

epoch 974: avg test  loss 1515.87, bar  test loss 3.322, len  test loss 0.036, col  test loss 136.433


Epoch 975: 272batch [00:35,  7.61batch/s, loss=1.61e+3]


epoch 975: avg train loss 1498.71, bar train loss 3.124, len train loss 0.033, col train loss 134.765
epoch 975: avg test  loss 1519.87, bar  test loss 3.890, len  test loss 0.034, col  test loss 136.874


Epoch 976: 272batch [00:35,  7.56batch/s, loss=1.53e+3]


epoch 976: avg train loss 1500.10, bar train loss 3.142, len train loss 0.032, col train loss 135.189


Epoch 977: 1batch [00:00,  7.81batch/s, loss=1.43e+3]

epoch 976: avg test  loss 1514.75, bar  test loss 3.582, len  test loss 0.034, col  test loss 136.375


Epoch 977: 272batch [00:35,  7.58batch/s, loss=1.47e+3]


epoch 977: avg train loss 1499.40, bar train loss 3.230, len train loss 0.033, col train loss 135.043


Epoch 978: 1batch [00:00,  8.77batch/s, loss=1.51e+3]

epoch 977: avg test  loss 1520.04, bar  test loss 3.732, len  test loss 0.039, col  test loss 137.764


Epoch 978: 272batch [00:35,  7.61batch/s, loss=1.63e+3]


epoch 978: avg train loss 1502.45, bar train loss 3.223, len train loss 0.035, col train loss 135.355


Epoch 979: 1batch [00:00,  8.77batch/s, loss=1.53e+3]

epoch 978: avg test  loss 1513.85, bar  test loss 3.407, len  test loss 0.040, col  test loss 136.987


Epoch 979: 272batch [00:35,  7.63batch/s, loss=1.52e+3]


epoch 979: avg train loss 1500.61, bar train loss 3.196, len train loss 0.032, col train loss 134.914


Epoch 980: 1batch [00:00,  8.85batch/s, loss=1.49e+3]

epoch 979: avg test  loss 1515.58, bar  test loss 3.224, len  test loss 0.034, col  test loss 136.382


Epoch 980: 272batch [00:36,  7.52batch/s, loss=1.6e+3] 


epoch 980: avg train loss 1499.30, bar train loss 3.189, len train loss 0.033, col train loss 134.872
epoch 980: avg test  loss 1527.11, bar  test loss 3.966, len  test loss 0.036, col  test loss 136.964


Epoch 981: 272batch [00:35,  7.58batch/s, loss=1.51e+3]


epoch 981: avg train loss 1500.01, bar train loss 3.158, len train loss 0.032, col train loss 135.245


Epoch 982: 1batch [00:00,  8.41batch/s, loss=1.54e+3]

epoch 981: avg test  loss 1519.21, bar  test loss 3.309, len  test loss 0.034, col  test loss 137.274


Epoch 982: 272batch [00:36,  7.52batch/s, loss=1.5e+3] 


epoch 982: avg train loss 1500.58, bar train loss 3.254, len train loss 0.033, col train loss 135.024


Epoch 983: 1batch [00:00,  8.47batch/s, loss=1.51e+3]

epoch 982: avg test  loss 1521.74, bar  test loss 3.313, len  test loss 0.034, col  test loss 137.128


Epoch 983: 272batch [00:35,  7.59batch/s, loss=1.54e+3]


epoch 983: avg train loss 1497.61, bar train loss 3.168, len train loss 0.033, col train loss 134.763


Epoch 984: 1batch [00:00,  8.77batch/s, loss=1.38e+3]

epoch 983: avg test  loss 1518.36, bar  test loss 3.410, len  test loss 0.039, col  test loss 136.061


Epoch 984: 272batch [00:35,  7.65batch/s, loss=1.43e+3]


epoch 984: avg train loss 1501.14, bar train loss 3.283, len train loss 0.035, col train loss 135.074


Epoch 985: 1batch [00:00,  8.77batch/s, loss=1.59e+3]

epoch 984: avg test  loss 1519.69, bar  test loss 3.559, len  test loss 0.038, col  test loss 136.288


Epoch 985: 272batch [00:35,  7.59batch/s, loss=1.56e+3]


epoch 985: avg train loss 1500.91, bar train loss 3.075, len train loss 0.032, col train loss 135.162
epoch 985: avg test  loss 1516.04, bar  test loss 3.398, len  test loss 0.034, col  test loss 136.189


Epoch 986: 272batch [00:36,  7.55batch/s, loss=1.47e+3]


epoch 986: avg train loss 1501.11, bar train loss 3.131, len train loss 0.034, col train loss 135.107


Epoch 987: 1batch [00:00,  6.99batch/s, loss=1.43e+3]

epoch 986: avg test  loss 1521.39, bar  test loss 3.291, len  test loss 0.036, col  test loss 136.496


Epoch 987: 272batch [00:36,  7.54batch/s, loss=1.34e+3]


epoch 987: avg train loss 1505.15, bar train loss 3.234, len train loss 0.037, col train loss 135.643


Epoch 988: 1batch [00:00,  8.70batch/s, loss=1.51e+3]

epoch 987: avg test  loss 1524.51, bar  test loss 3.544, len  test loss 0.038, col  test loss 137.114


Epoch 988: 272batch [00:36,  7.55batch/s, loss=1.56e+3]


epoch 988: avg train loss 1505.66, bar train loss 3.356, len train loss 0.035, col train loss 135.428


Epoch 989: 1batch [00:00,  8.33batch/s, loss=1.53e+3]

epoch 988: avg test  loss 1533.01, bar  test loss 3.122, len  test loss 0.047, col  test loss 139.006


Epoch 989: 272batch [00:35,  7.58batch/s, loss=1.46e+3]


epoch 989: avg train loss 1500.61, bar train loss 3.180, len train loss 0.034, col train loss 135.107


Epoch 990: 1batch [00:00,  8.62batch/s, loss=1.45e+3]

epoch 989: avg test  loss 1524.13, bar  test loss 4.113, len  test loss 0.034, col  test loss 136.697


Epoch 990: 272batch [00:35,  7.59batch/s, loss=1.52e+3]


epoch 990: avg train loss 1500.88, bar train loss 3.215, len train loss 0.033, col train loss 134.904
epoch 990: avg test  loss 1518.41, bar  test loss 3.446, len  test loss 0.041, col  test loss 136.341


Epoch 991: 272batch [00:36,  7.55batch/s, loss=1.49e+3]


epoch 991: avg train loss 1502.95, bar train loss 3.154, len train loss 0.033, col train loss 135.008


Epoch 992: 1batch [00:00,  7.81batch/s, loss=1.58e+3]

epoch 991: avg test  loss 1544.90, bar  test loss 3.685, len  test loss 0.038, col  test loss 139.761


Epoch 992: 272batch [00:36,  7.53batch/s, loss=1.72e+3]


epoch 992: avg train loss 1502.22, bar train loss 3.051, len train loss 0.033, col train loss 135.311


Epoch 993: 1batch [00:00,  8.33batch/s, loss=1.47e+3]

epoch 992: avg test  loss 1525.01, bar  test loss 3.754, len  test loss 0.035, col  test loss 136.416


Epoch 993: 272batch [00:36,  7.55batch/s, loss=1.69e+3]


epoch 993: avg train loss 1504.57, bar train loss 3.222, len train loss 0.034, col train loss 135.508


Epoch 994: 1batch [00:00,  8.47batch/s, loss=1.54e+3]

epoch 993: avg test  loss 1519.90, bar  test loss 3.167, len  test loss 0.034, col  test loss 137.157


Epoch 994: 272batch [00:36,  7.55batch/s, loss=1.48e+3]


epoch 994: avg train loss 1502.86, bar train loss 3.250, len train loss 0.033, col train loss 135.481


Epoch 995: 1batch [00:00,  9.01batch/s, loss=1.53e+3]

epoch 994: avg test  loss 1548.51, bar  test loss 5.373, len  test loss 0.036, col  test loss 138.116


Epoch 995: 272batch [00:36,  7.53batch/s, loss=1.56e+3]


epoch 995: avg train loss 1502.07, bar train loss 3.269, len train loss 0.033, col train loss 135.479
epoch 995: avg test  loss 1521.15, bar  test loss 3.453, len  test loss 0.035, col  test loss 136.758


Epoch 996: 272batch [00:36,  7.52batch/s, loss=1.5e+3] 


epoch 996: avg train loss 1503.20, bar train loss 3.178, len train loss 0.033, col train loss 135.270


Epoch 997: 1batch [00:00,  8.77batch/s, loss=1.56e+3]

epoch 996: avg test  loss 1522.21, bar  test loss 3.423, len  test loss 0.034, col  test loss 137.094


Epoch 997: 272batch [00:36,  7.50batch/s, loss=1.43e+3]


epoch 997: avg train loss 1505.57, bar train loss 3.279, len train loss 0.035, col train loss 135.480


Epoch 998: 1batch [00:00,  8.93batch/s, loss=1.57e+3]

epoch 997: avg test  loss 1524.38, bar  test loss 3.675, len  test loss 0.039, col  test loss 136.704


Epoch 998: 272batch [00:36,  7.49batch/s, loss=1.5e+3] 


epoch 998: avg train loss 1507.60, bar train loss 3.319, len train loss 0.034, col train loss 135.687


Epoch 999: 1batch [00:00,  8.33batch/s, loss=1.44e+3]

epoch 998: avg test  loss 1515.85, bar  test loss 3.169, len  test loss 0.035, col  test loss 136.686


Epoch 999: 272batch [00:36,  7.48batch/s, loss=1.43e+3]


epoch 999: avg train loss 1505.15, bar train loss 3.316, len train loss 0.035, col train loss 135.388


Epoch 1000: 1batch [00:00,  8.20batch/s, loss=1.52e+3]

epoch 999: avg test  loss 1542.81, bar  test loss 4.652, len  test loss 0.037, col  test loss 137.168


Epoch 1000: 272batch [00:36,  7.52batch/s, loss=1.59e+3]


epoch 1000: avg train loss 1504.56, bar train loss 3.256, len train loss 0.034, col train loss 135.354
epoch 1000: avg test  loss 1514.71, bar  test loss 3.140, len  test loss 0.035, col  test loss 136.569


Epoch 1001: 272batch [00:36,  7.50batch/s, loss=1.36e+3]


epoch 1001: avg train loss 1501.44, bar train loss 3.235, len train loss 0.033, col train loss 135.370


Epoch 1002: 1batch [00:00,  7.81batch/s, loss=1.59e+3]

epoch 1001: avg test  loss 1519.57, bar  test loss 3.444, len  test loss 0.036, col  test loss 137.392


Epoch 1002: 272batch [00:37,  7.35batch/s, loss=1.41e+3]


epoch 1002: avg train loss 1503.77, bar train loss 3.153, len train loss 0.035, col train loss 135.336


Epoch 1003: 0batch [00:00, ?batch/s]

epoch 1002: avg test  loss 1524.50, bar  test loss 3.379, len  test loss 0.038, col  test loss 138.393


Epoch 1003: 272batch [00:37,  7.31batch/s, loss=1.48e+3]


epoch 1003: avg train loss 1504.12, bar train loss 3.155, len train loss 0.034, col train loss 135.789


Epoch 1004: 1batch [00:00,  8.70batch/s, loss=1.55e+3]

epoch 1003: avg test  loss 1526.26, bar  test loss 3.746, len  test loss 0.040, col  test loss 137.332


Epoch 1004: 272batch [00:36,  7.35batch/s, loss=1.33e+3]


epoch 1004: avg train loss 1507.82, bar train loss 3.301, len train loss 0.035, col train loss 135.860


Epoch 1005: 1batch [00:00,  7.14batch/s, loss=1.61e+3]

epoch 1004: avg test  loss 1527.10, bar  test loss 4.212, len  test loss 0.034, col  test loss 136.946


Epoch 1005: 272batch [00:36,  7.35batch/s, loss=1.51e+3]


epoch 1005: avg train loss 1506.26, bar train loss 3.243, len train loss 0.034, col train loss 135.710
epoch 1005: avg test  loss 1523.97, bar  test loss 3.744, len  test loss 0.036, col  test loss 136.966


Epoch 1006: 272batch [00:36,  7.48batch/s, loss=1.52e+3]


epoch 1006: avg train loss 1504.37, bar train loss 3.326, len train loss 0.034, col train loss 135.407


Epoch 1007: 1batch [00:00,  7.41batch/s, loss=1.56e+3]

epoch 1006: avg test  loss 1524.40, bar  test loss 3.464, len  test loss 0.039, col  test loss 137.676


Epoch 1007: 272batch [00:36,  7.49batch/s, loss=1.46e+3]


epoch 1007: avg train loss 1507.05, bar train loss 3.244, len train loss 0.034, col train loss 135.745


Epoch 1008: 1batch [00:00,  8.40batch/s, loss=1.55e+3]

epoch 1007: avg test  loss 1514.65, bar  test loss 3.183, len  test loss 0.037, col  test loss 136.619


Epoch 1008: 272batch [00:36,  7.47batch/s, loss=1.48e+3]


epoch 1008: avg train loss 1504.07, bar train loss 3.217, len train loss 0.037, col train loss 135.676


Epoch 1009: 1batch [00:00,  8.26batch/s, loss=1.5e+3]

epoch 1008: avg test  loss 1536.14, bar  test loss 4.109, len  test loss 0.040, col  test loss 137.343


Epoch 1009: 272batch [00:36,  7.49batch/s, loss=1.5e+3] 


epoch 1009: avg train loss 1509.26, bar train loss 3.375, len train loss 0.035, col train loss 135.856


Epoch 1010: 1batch [00:00,  8.77batch/s, loss=1.51e+3]

epoch 1009: avg test  loss 1533.67, bar  test loss 3.369, len  test loss 0.037, col  test loss 138.105


Epoch 1010: 272batch [00:36,  7.49batch/s, loss=1.45e+3]


epoch 1010: avg train loss 1505.45, bar train loss 3.159, len train loss 0.034, col train loss 135.892
epoch 1010: avg test  loss 1527.37, bar  test loss 3.585, len  test loss 0.034, col  test loss 137.495


Epoch 1011: 272batch [00:36,  7.46batch/s, loss=1.53e+3]


epoch 1011: avg train loss 1509.55, bar train loss 3.338, len train loss 0.034, col train loss 135.760


Epoch 1012: 1batch [00:00,  7.63batch/s, loss=1.48e+3]

epoch 1011: avg test  loss 1521.71, bar  test loss 3.177, len  test loss 0.039, col  test loss 137.705


Epoch 1012: 272batch [00:36,  7.46batch/s, loss=1.58e+3]


epoch 1012: avg train loss 1505.37, bar train loss 3.172, len train loss 0.035, col train loss 135.786


Epoch 1013: 1batch [00:00,  8.40batch/s, loss=1.56e+3]

epoch 1012: avg test  loss 1534.40, bar  test loss 3.366, len  test loss 0.039, col  test loss 138.804


Epoch 1013: 272batch [00:36,  7.45batch/s, loss=1.43e+3]


epoch 1013: avg train loss 1507.42, bar train loss 3.382, len train loss 0.035, col train loss 135.751


Epoch 1014: 1batch [00:00,  8.40batch/s, loss=1.51e+3]

epoch 1013: avg test  loss 1519.68, bar  test loss 3.290, len  test loss 0.037, col  test loss 135.936


Epoch 1014: 272batch [00:36,  7.41batch/s, loss=1.45e+3]


epoch 1014: avg train loss 1505.95, bar train loss 3.241, len train loss 0.034, col train loss 135.582


Epoch 1015: 1batch [00:00,  8.48batch/s, loss=1.51e+3]

epoch 1014: avg test  loss 1522.06, bar  test loss 3.269, len  test loss 0.035, col  test loss 137.618


Epoch 1015: 272batch [00:36,  7.42batch/s, loss=1.48e+3]


epoch 1015: avg train loss 1506.20, bar train loss 3.151, len train loss 0.035, col train loss 135.631
epoch 1015: avg test  loss 1539.34, bar  test loss 4.534, len  test loss 0.044, col  test loss 136.677


Epoch 1016: 272batch [00:36,  7.43batch/s, loss=1.55e+3]


epoch 1016: avg train loss 1508.81, bar train loss 3.456, len train loss 0.035, col train loss 135.775


Epoch 1017: 1batch [00:00,  7.75batch/s, loss=1.58e+3]

epoch 1016: avg test  loss 1526.13, bar  test loss 3.712, len  test loss 0.036, col  test loss 137.018


Epoch 1017: 272batch [00:36,  7.50batch/s, loss=1.61e+3]


epoch 1017: avg train loss 1511.54, bar train loss 3.534, len train loss 0.035, col train loss 136.271


Epoch 1018: 1batch [00:00,  8.26batch/s, loss=1.52e+3]

epoch 1017: avg test  loss 1521.71, bar  test loss 3.238, len  test loss 0.036, col  test loss 137.234


Epoch 1018: 272batch [00:36,  7.41batch/s, loss=1.55e+3]


epoch 1018: avg train loss 1506.30, bar train loss 3.138, len train loss 0.035, col train loss 135.841


Epoch 1019: 1batch [00:00,  7.58batch/s, loss=1.48e+3]

epoch 1018: avg test  loss 1548.49, bar  test loss 5.125, len  test loss 0.038, col  test loss 137.812


Epoch 1019: 272batch [00:36,  7.42batch/s, loss=1.67e+3]


epoch 1019: avg train loss 1509.14, bar train loss 3.330, len train loss 0.034, col train loss 135.814


Epoch 1020: 1batch [00:00,  8.47batch/s, loss=1.5e+3]

epoch 1019: avg test  loss 1516.30, bar  test loss 3.121, len  test loss 0.036, col  test loss 136.855


Epoch 1020: 272batch [00:36,  7.42batch/s, loss=1.54e+3]


epoch 1020: avg train loss 1506.74, bar train loss 3.239, len train loss 0.033, col train loss 135.628
epoch 1020: avg test  loss 1518.04, bar  test loss 3.351, len  test loss 0.036, col  test loss 136.327


Epoch 1021: 272batch [00:36,  7.41batch/s, loss=1.54e+3]


epoch 1021: avg train loss 1508.45, bar train loss 3.238, len train loss 0.034, col train loss 135.907


Epoch 1022: 1batch [00:00,  8.13batch/s, loss=1.44e+3]

epoch 1021: avg test  loss 1528.30, bar  test loss 3.452, len  test loss 0.038, col  test loss 138.608


Epoch 1022: 272batch [00:36,  7.41batch/s, loss=1.45e+3]


epoch 1022: avg train loss 1510.71, bar train loss 3.225, len train loss 0.034, col train loss 136.049


Epoch 1023: 1batch [00:00,  8.00batch/s, loss=1.47e+3]

epoch 1022: avg test  loss 1523.83, bar  test loss 3.471, len  test loss 0.037, col  test loss 136.212


Epoch 1023: 272batch [00:36,  7.38batch/s, loss=1.54e+3]


epoch 1023: avg train loss 1507.15, bar train loss 3.280, len train loss 0.034, col train loss 135.994


Epoch 1024: 1batch [00:00,  7.94batch/s, loss=1.49e+3]

epoch 1023: avg test  loss 1527.41, bar  test loss 4.066, len  test loss 0.036, col  test loss 137.310


Epoch 1024: 272batch [00:36,  7.41batch/s, loss=1.45e+3]


epoch 1024: avg train loss 1507.60, bar train loss 3.246, len train loss 0.034, col train loss 136.097


Epoch 1025: 1batch [00:00,  7.69batch/s, loss=1.49e+3]

epoch 1024: avg test  loss 1547.90, bar  test loss 5.808, len  test loss 0.036, col  test loss 137.991


Epoch 1025: 272batch [00:36,  7.42batch/s, loss=1.59e+3]


epoch 1025: avg train loss 1508.44, bar train loss 3.323, len train loss 0.034, col train loss 135.894
epoch 1025: avg test  loss 1535.32, bar  test loss 3.824, len  test loss 0.041, col  test loss 136.904


Epoch 1026: 272batch [00:36,  7.39batch/s, loss=1.5e+3] 


epoch 1026: avg train loss 1512.78, bar train loss 3.590, len train loss 0.037, col train loss 136.063


Epoch 1027: 1batch [00:00,  8.55batch/s, loss=1.6e+3]

epoch 1026: avg test  loss 1520.50, bar  test loss 3.234, len  test loss 0.038, col  test loss 136.877


Epoch 1027: 272batch [00:36,  7.43batch/s, loss=1.55e+3]


epoch 1027: avg train loss 1509.07, bar train loss 3.293, len train loss 0.035, col train loss 135.773


Epoch 1028: 1batch [00:00,  8.47batch/s, loss=1.47e+3]

epoch 1027: avg test  loss 1556.55, bar  test loss 6.008, len  test loss 0.038, col  test loss 138.004


Epoch 1028: 272batch [00:37,  7.35batch/s, loss=1.44e+3]


epoch 1028: avg train loss 1512.51, bar train loss 3.407, len train loss 0.035, col train loss 136.353


Epoch 1029: 1batch [00:00,  8.40batch/s, loss=1.47e+3]

epoch 1028: avg test  loss 1525.44, bar  test loss 3.345, len  test loss 0.034, col  test loss 137.350


Epoch 1029: 272batch [00:36,  7.37batch/s, loss=1.41e+3]


epoch 1029: avg train loss 1509.68, bar train loss 3.206, len train loss 0.035, col train loss 135.924


Epoch 1030: 1batch [00:00,  8.70batch/s, loss=1.51e+3]

epoch 1029: avg test  loss 1534.57, bar  test loss 3.598, len  test loss 0.039, col  test loss 138.546


Epoch 1030: 272batch [00:36,  7.36batch/s, loss=1.59e+3]


epoch 1030: avg train loss 1511.96, bar train loss 3.313, len train loss 0.034, col train loss 136.133
epoch 1030: avg test  loss 1525.63, bar  test loss 3.777, len  test loss 0.035, col  test loss 137.516


Epoch 1031: 272batch [00:36,  7.36batch/s, loss=1.6e+3] 


epoch 1031: avg train loss 1511.57, bar train loss 3.339, len train loss 0.035, col train loss 136.189


Epoch 1032: 1batch [00:00,  8.77batch/s, loss=1.59e+3]

epoch 1031: avg test  loss 1524.35, bar  test loss 3.276, len  test loss 0.038, col  test loss 138.353


Epoch 1032: 272batch [00:36,  7.38batch/s, loss=1.37e+3]


epoch 1032: avg train loss 1509.71, bar train loss 3.325, len train loss 0.034, col train loss 135.825


Epoch 1033: 1batch [00:00,  8.85batch/s, loss=1.54e+3]

epoch 1032: avg test  loss 1531.58, bar  test loss 4.218, len  test loss 0.039, col  test loss 136.530


Epoch 1033: 272batch [00:36,  7.42batch/s, loss=1.57e+3]


epoch 1033: avg train loss 1510.38, bar train loss 3.232, len train loss 0.034, col train loss 136.032


Epoch 1034: 1batch [00:00,  8.26batch/s, loss=1.46e+3]

epoch 1033: avg test  loss 1520.95, bar  test loss 3.348, len  test loss 0.037, col  test loss 137.229


Epoch 1034: 272batch [00:36,  7.39batch/s, loss=1.51e+3]


epoch 1034: avg train loss 1509.58, bar train loss 3.318, len train loss 0.033, col train loss 136.094


Epoch 1035: 1batch [00:00,  7.04batch/s, loss=1.53e+3]

epoch 1034: avg test  loss 1529.90, bar  test loss 3.381, len  test loss 0.040, col  test loss 138.144


Epoch 1035: 272batch [00:36,  7.39batch/s, loss=1.55e+3]


epoch 1035: avg train loss 1508.73, bar train loss 3.329, len train loss 0.035, col train loss 136.095
epoch 1035: avg test  loss 1526.98, bar  test loss 3.094, len  test loss 0.034, col  test loss 137.227


Epoch 1036: 272batch [00:37,  7.31batch/s, loss=1.46e+3]


epoch 1036: avg train loss 1512.84, bar train loss 3.263, len train loss 0.034, col train loss 136.190


Epoch 1037: 1batch [00:00,  7.94batch/s, loss=1.44e+3]

epoch 1036: avg test  loss 1531.43, bar  test loss 3.319, len  test loss 0.038, col  test loss 137.821


Epoch 1037: 272batch [00:37,  7.30batch/s, loss=1.49e+3]


epoch 1037: avg train loss 1510.89, bar train loss 3.177, len train loss 0.034, col train loss 136.028


Epoch 1038: 1batch [00:00,  8.40batch/s, loss=1.54e+3]

epoch 1037: avg test  loss 1524.20, bar  test loss 3.518, len  test loss 0.034, col  test loss 136.557


Epoch 1038: 272batch [00:36,  7.39batch/s, loss=1.35e+3]


epoch 1038: avg train loss 1510.21, bar train loss 3.351, len train loss 0.033, col train loss 135.998


Epoch 1039: 1batch [00:00,  8.47batch/s, loss=1.52e+3]

epoch 1038: avg test  loss 1524.36, bar  test loss 3.439, len  test loss 0.038, col  test loss 137.133


Epoch 1039: 272batch [00:36,  7.37batch/s, loss=1.41e+3]


epoch 1039: avg train loss 1510.04, bar train loss 3.259, len train loss 0.034, col train loss 136.186


Epoch 1040: 1batch [00:00,  8.26batch/s, loss=1.58e+3]

epoch 1039: avg test  loss 1523.79, bar  test loss 3.365, len  test loss 0.040, col  test loss 137.953


Epoch 1040: 272batch [00:37,  7.33batch/s, loss=1.61e+3]


epoch 1040: avg train loss 1512.99, bar train loss 3.237, len train loss 0.037, col train loss 136.783
epoch 1040: avg test  loss 1545.89, bar  test loss 4.482, len  test loss 0.048, col  test loss 138.944


Epoch 1041: 272batch [00:36,  7.36batch/s, loss=1.39e+3]


epoch 1041: avg train loss 1515.57, bar train loss 3.402, len train loss 0.034, col train loss 136.317


Epoch 1042: 1batch [00:00,  9.01batch/s, loss=1.52e+3]

epoch 1041: avg test  loss 1525.22, bar  test loss 3.208, len  test loss 0.037, col  test loss 137.554


Epoch 1042: 272batch [00:37,  7.18batch/s, loss=1.5e+3] 


epoch 1042: avg train loss 1511.48, bar train loss 3.230, len train loss 0.034, col train loss 136.241


Epoch 1043: 1batch [00:00,  9.17batch/s, loss=1.46e+3]

epoch 1042: avg test  loss 1526.66, bar  test loss 3.408, len  test loss 0.037, col  test loss 137.231


Epoch 1043: 272batch [00:37,  7.17batch/s, loss=1.45e+3]


epoch 1043: avg train loss 1516.18, bar train loss 3.296, len train loss 0.037, col train loss 136.424


Epoch 1044: 1batch [00:00,  8.13batch/s, loss=1.55e+3]

epoch 1043: avg test  loss 1526.39, bar  test loss 3.273, len  test loss 0.036, col  test loss 136.685


Epoch 1044: 272batch [00:37,  7.22batch/s, loss=1.44e+3]


epoch 1044: avg train loss 1510.38, bar train loss 3.286, len train loss 0.034, col train loss 135.892


Epoch 1045: 1batch [00:00,  8.13batch/s, loss=1.5e+3]

epoch 1044: avg test  loss 1539.35, bar  test loss 4.030, len  test loss 0.038, col  test loss 137.762


Epoch 1045: 272batch [00:37,  7.20batch/s, loss=1.48e+3]


epoch 1045: avg train loss 1512.58, bar train loss 3.325, len train loss 0.035, col train loss 136.431
epoch 1045: avg test  loss 1536.39, bar  test loss 4.453, len  test loss 0.038, col  test loss 137.994


Epoch 1046: 272batch [00:37,  7.26batch/s, loss=1.59e+3]


epoch 1046: avg train loss 1517.94, bar train loss 3.573, len train loss 0.035, col train loss 136.660


Epoch 1047: 1batch [00:00,  7.69batch/s, loss=1.47e+3]

epoch 1046: avg test  loss 1524.24, bar  test loss 3.327, len  test loss 0.037, col  test loss 137.631


Epoch 1047: 272batch [00:37,  7.30batch/s, loss=1.42e+3]


epoch 1047: avg train loss 1514.28, bar train loss 3.277, len train loss 0.034, col train loss 136.518


Epoch 1048: 1batch [00:00,  8.93batch/s, loss=1.48e+3]

epoch 1047: avg test  loss 1547.35, bar  test loss 4.883, len  test loss 0.038, col  test loss 138.076


Epoch 1048: 272batch [00:36,  7.37batch/s, loss=1.41e+3]


epoch 1048: avg train loss 1516.84, bar train loss 3.387, len train loss 0.035, col train loss 136.560


Epoch 1049: 1batch [00:00,  7.94batch/s, loss=1.45e+3]

epoch 1048: avg test  loss 1525.66, bar  test loss 3.420, len  test loss 0.034, col  test loss 137.230


Epoch 1049: 272batch [00:37,  7.26batch/s, loss=1.5e+3] 


epoch 1049: avg train loss 1510.59, bar train loss 3.298, len train loss 0.033, col train loss 136.182


Epoch 1050: 1batch [00:00,  8.62batch/s, loss=1.56e+3]

epoch 1049: avg test  loss 1529.80, bar  test loss 3.346, len  test loss 0.037, col  test loss 138.232


Epoch 1050: 272batch [00:37,  7.32batch/s, loss=1.46e+3]


epoch 1050: avg train loss 1511.22, bar train loss 3.199, len train loss 0.033, col train loss 136.236
epoch 1050: avg test  loss 1539.05, bar  test loss 4.705, len  test loss 0.037, col  test loss 137.713


Epoch 1051: 272batch [00:37,  7.28batch/s, loss=1.64e+3]


epoch 1051: avg train loss 1515.96, bar train loss 3.350, len train loss 0.035, col train loss 136.491


Epoch 1052: 1batch [00:00,  8.47batch/s, loss=1.47e+3]

epoch 1051: avg test  loss 1525.36, bar  test loss 3.308, len  test loss 0.035, col  test loss 136.734


Epoch 1052: 272batch [00:37,  7.29batch/s, loss=1.59e+3]


epoch 1052: avg train loss 1511.52, bar train loss 3.241, len train loss 0.034, col train loss 136.530


Epoch 1053: 1batch [00:00,  8.26batch/s, loss=1.57e+3]

epoch 1052: avg test  loss 1526.55, bar  test loss 3.284, len  test loss 0.041, col  test loss 138.159


Epoch 1053: 272batch [00:37,  7.25batch/s, loss=1.59e+3]


epoch 1053: avg train loss 1511.92, bar train loss 3.239, len train loss 0.035, col train loss 136.287


Epoch 1054: 1batch [00:00,  8.55batch/s, loss=1.51e+3]

epoch 1053: avg test  loss 1527.88, bar  test loss 3.253, len  test loss 0.036, col  test loss 138.250


Epoch 1054: 272batch [00:37,  7.21batch/s, loss=1.56e+3]


epoch 1054: avg train loss 1514.69, bar train loss 3.425, len train loss 0.034, col train loss 136.529


Epoch 1055: 1batch [00:00,  8.13batch/s, loss=1.42e+3]

epoch 1054: avg test  loss 1531.21, bar  test loss 3.552, len  test loss 0.038, col  test loss 137.724


Epoch 1055: 272batch [00:37,  7.34batch/s, loss=1.61e+3]


epoch 1055: avg train loss 1515.98, bar train loss 3.540, len train loss 0.034, col train loss 136.497
epoch 1055: avg test  loss 1540.40, bar  test loss 3.879, len  test loss 0.039, col  test loss 138.780


Epoch 1056: 272batch [00:37,  7.29batch/s, loss=1.53e+3]


epoch 1056: avg train loss 1512.48, bar train loss 3.285, len train loss 0.035, col train loss 136.466


Epoch 1057: 1batch [00:00,  7.35batch/s, loss=1.48e+3]

epoch 1056: avg test  loss 1529.89, bar  test loss 3.370, len  test loss 0.034, col  test loss 138.335


Epoch 1057: 272batch [00:37,  7.25batch/s, loss=1.64e+3]


epoch 1057: avg train loss 1510.38, bar train loss 3.295, len train loss 0.036, col train loss 136.489


Epoch 1058: 1batch [00:00,  8.06batch/s, loss=1.55e+3]

epoch 1057: avg test  loss 1530.68, bar  test loss 3.462, len  test loss 0.038, col  test loss 138.114


Epoch 1058: 272batch [00:37,  7.28batch/s, loss=1.38e+3]


epoch 1058: avg train loss 1516.12, bar train loss 3.340, len train loss 0.035, col train loss 136.593


Epoch 1059: 1batch [00:00,  8.00batch/s, loss=1.52e+3]

epoch 1058: avg test  loss 1535.16, bar  test loss 3.690, len  test loss 0.040, col  test loss 137.945


Epoch 1059: 272batch [00:37,  7.29batch/s, loss=1.5e+3] 


epoch 1059: avg train loss 1511.73, bar train loss 3.210, len train loss 0.034, col train loss 136.188


Epoch 1060: 1batch [00:00,  8.20batch/s, loss=1.49e+3]

epoch 1059: avg test  loss 1525.75, bar  test loss 3.603, len  test loss 0.039, col  test loss 137.112


Epoch 1060: 272batch [00:37,  7.28batch/s, loss=1.42e+3]


epoch 1060: avg train loss 1513.56, bar train loss 3.274, len train loss 0.034, col train loss 136.239
epoch 1060: avg test  loss 1530.88, bar  test loss 3.295, len  test loss 0.043, col  test loss 138.319


Epoch 1061: 272batch [00:37,  7.21batch/s, loss=1.63e+3]


epoch 1061: avg train loss 1512.21, bar train loss 3.246, len train loss 0.034, col train loss 136.117


Epoch 1062: 1batch [00:00,  7.81batch/s, loss=1.51e+3]

epoch 1061: avg test  loss 1523.47, bar  test loss 3.276, len  test loss 0.037, col  test loss 137.273


Epoch 1062: 272batch [00:37,  7.26batch/s, loss=1.46e+3]


epoch 1062: avg train loss 1511.08, bar train loss 3.246, len train loss 0.034, col train loss 136.458


Epoch 1063: 1batch [00:00,  8.77batch/s, loss=1.44e+3]

epoch 1062: avg test  loss 1539.11, bar  test loss 4.397, len  test loss 0.037, col  test loss 137.727


Epoch 1063: 272batch [00:37,  7.25batch/s, loss=1.47e+3]


epoch 1063: avg train loss 1518.78, bar train loss 3.452, len train loss 0.039, col train loss 136.839


Epoch 1064: 1batch [00:00,  6.80batch/s, loss=1.48e+3]

epoch 1063: avg test  loss 1540.37, bar  test loss 4.317, len  test loss 0.040, col  test loss 137.866


Epoch 1064: 272batch [00:37,  7.18batch/s, loss=1.55e+3]


epoch 1064: avg train loss 1512.63, bar train loss 3.358, len train loss 0.033, col train loss 136.394


Epoch 1065: 1batch [00:00,  7.75batch/s, loss=1.5e+3]

epoch 1064: avg test  loss 1538.43, bar  test loss 3.644, len  test loss 0.038, col  test loss 138.961


Epoch 1065: 272batch [00:38,  7.15batch/s, loss=1.44e+3]


epoch 1065: avg train loss 1514.91, bar train loss 3.343, len train loss 0.036, col train loss 136.332
epoch 1065: avg test  loss 1525.94, bar  test loss 3.320, len  test loss 0.041, col  test loss 137.011


Epoch 1066: 272batch [00:37,  7.27batch/s, loss=1.64e+3]


epoch 1066: avg train loss 1517.27, bar train loss 3.495, len train loss 0.037, col train loss 136.730


Epoch 1067: 1batch [00:00,  7.75batch/s, loss=1.5e+3]

epoch 1066: avg test  loss 1532.56, bar  test loss 3.707, len  test loss 0.036, col  test loss 137.326


Epoch 1067: 272batch [00:37,  7.22batch/s, loss=1.49e+3]


epoch 1067: avg train loss 1513.73, bar train loss 3.235, len train loss 0.032, col train loss 136.588


Epoch 1068: 1batch [00:00,  7.75batch/s, loss=1.44e+3]

epoch 1067: avg test  loss 1530.54, bar  test loss 3.391, len  test loss 0.036, col  test loss 138.298


Epoch 1068: 272batch [00:37,  7.34batch/s, loss=1.48e+3]


epoch 1068: avg train loss 1515.45, bar train loss 3.336, len train loss 0.036, col train loss 136.651


Epoch 1069: 1batch [00:00,  8.13batch/s, loss=1.49e+3]

epoch 1068: avg test  loss 1523.69, bar  test loss 3.431, len  test loss 0.041, col  test loss 137.107


Epoch 1069: 272batch [00:37,  7.29batch/s, loss=1.57e+3]


epoch 1069: avg train loss 1513.44, bar train loss 3.335, len train loss 0.034, col train loss 136.374


Epoch 1070: 1batch [00:00,  8.00batch/s, loss=1.49e+3]

epoch 1069: avg test  loss 1533.91, bar  test loss 3.415, len  test loss 0.036, col  test loss 138.145


Epoch 1070: 272batch [00:37,  7.23batch/s, loss=1.51e+3]


epoch 1070: avg train loss 1515.66, bar train loss 3.305, len train loss 0.035, col train loss 136.423
epoch 1070: avg test  loss 1531.41, bar  test loss 3.448, len  test loss 0.038, col  test loss 137.441


Epoch 1071: 272batch [00:37,  7.23batch/s, loss=1.57e+3]


epoch 1071: avg train loss 1514.05, bar train loss 3.319, len train loss 0.036, col train loss 136.544


Epoch 1072: 1batch [00:00,  8.33batch/s, loss=1.55e+3]

epoch 1071: avg test  loss 1528.48, bar  test loss 3.486, len  test loss 0.038, col  test loss 137.886


Epoch 1072: 272batch [00:37,  7.25batch/s, loss=1.57e+3]


epoch 1072: avg train loss 1517.16, bar train loss 3.267, len train loss 0.035, col train loss 137.137


Epoch 1073: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1072: avg test  loss 1555.78, bar  test loss 3.803, len  test loss 0.049, col  test loss 141.446


Epoch 1073: 272batch [00:37,  7.24batch/s, loss=1.45e+3]


epoch 1073: avg train loss 1520.24, bar train loss 3.466, len train loss 0.036, col train loss 136.967


Epoch 1074: 1batch [00:00,  8.40batch/s, loss=1.54e+3]

epoch 1073: avg test  loss 1530.57, bar  test loss 3.768, len  test loss 0.035, col  test loss 137.683


Epoch 1074: 272batch [00:37,  7.26batch/s, loss=1.7e+3] 


epoch 1074: avg train loss 1514.86, bar train loss 3.323, len train loss 0.033, col train loss 136.744


Epoch 1075: 1batch [00:00,  8.06batch/s, loss=1.56e+3]

epoch 1074: avg test  loss 1530.16, bar  test loss 3.808, len  test loss 0.036, col  test loss 137.400


Epoch 1075: 272batch [00:37,  7.18batch/s, loss=1.5e+3] 


epoch 1075: avg train loss 1518.75, bar train loss 3.388, len train loss 0.035, col train loss 136.837
epoch 1075: avg test  loss 1526.92, bar  test loss 3.552, len  test loss 0.034, col  test loss 137.561


Epoch 1076: 272batch [00:37,  7.17batch/s, loss=1.39e+3]


epoch 1076: avg train loss 1513.57, bar train loss 3.308, len train loss 0.034, col train loss 136.618


Epoch 1077: 1batch [00:00,  7.87batch/s, loss=1.52e+3]

epoch 1076: avg test  loss 1522.56, bar  test loss 3.260, len  test loss 0.032, col  test loss 137.436


Epoch 1077: 272batch [00:37,  7.21batch/s, loss=1.59e+3]


epoch 1077: avg train loss 1516.86, bar train loss 3.247, len train loss 0.034, col train loss 136.886


Epoch 1078: 1batch [00:00,  8.06batch/s, loss=1.42e+3]

epoch 1077: avg test  loss 1534.29, bar  test loss 3.528, len  test loss 0.037, col  test loss 138.712


Epoch 1078: 272batch [00:37,  7.23batch/s, loss=1.59e+3]


epoch 1078: avg train loss 1519.84, bar train loss 3.257, len train loss 0.033, col train loss 137.221


Epoch 1079: 1batch [00:00,  7.75batch/s, loss=1.49e+3]

epoch 1078: avg test  loss 1533.79, bar  test loss 3.334, len  test loss 0.045, col  test loss 138.481


Epoch 1079: 272batch [00:38,  7.15batch/s, loss=1.62e+3]


epoch 1079: avg train loss 1518.57, bar train loss 3.438, len train loss 0.034, col train loss 136.826


Epoch 1080: 1batch [00:00,  8.93batch/s, loss=1.53e+3]

epoch 1079: avg test  loss 1540.33, bar  test loss 3.990, len  test loss 0.037, col  test loss 138.648


Epoch 1080: 272batch [00:37,  7.24batch/s, loss=1.43e+3]


epoch 1080: avg train loss 1517.82, bar train loss 3.392, len train loss 0.035, col train loss 136.927
epoch 1080: avg test  loss 1529.35, bar  test loss 3.269, len  test loss 0.034, col  test loss 138.158


Epoch 1081: 272batch [00:37,  7.18batch/s, loss=1.51e+3]


epoch 1081: avg train loss 1518.60, bar train loss 3.256, len train loss 0.037, col train loss 136.815


Epoch 1082: 1batch [00:00,  7.52batch/s, loss=1.55e+3]

epoch 1081: avg test  loss 1531.03, bar  test loss 3.601, len  test loss 0.039, col  test loss 138.431


Epoch 1082: 272batch [00:37,  7.20batch/s, loss=1.55e+3]


epoch 1082: avg train loss 1515.33, bar train loss 3.271, len train loss 0.036, col train loss 136.693


Epoch 1083: 1batch [00:00,  7.52batch/s, loss=1.54e+3]

epoch 1082: avg test  loss 1534.03, bar  test loss 3.544, len  test loss 0.040, col  test loss 137.735


Epoch 1083: 272batch [00:37,  7.20batch/s, loss=1.51e+3]


epoch 1083: avg train loss 1516.23, bar train loss 3.267, len train loss 0.035, col train loss 136.724


Epoch 1084: 1batch [00:00,  7.41batch/s, loss=1.58e+3]

epoch 1083: avg test  loss 1537.36, bar  test loss 4.160, len  test loss 0.045, col  test loss 138.163


Epoch 1084: 272batch [00:37,  7.18batch/s, loss=1.45e+3]


epoch 1084: avg train loss 1515.64, bar train loss 3.293, len train loss 0.035, col train loss 136.836


Epoch 1085: 1batch [00:00,  8.26batch/s, loss=1.53e+3]

epoch 1084: avg test  loss 1542.42, bar  test loss 3.861, len  test loss 0.049, col  test loss 138.538


Epoch 1085: 272batch [00:37,  7.19batch/s, loss=1.55e+3]


epoch 1085: avg train loss 1519.86, bar train loss 3.430, len train loss 0.036, col train loss 137.265
epoch 1085: avg test  loss 1535.65, bar  test loss 3.692, len  test loss 0.042, col  test loss 138.045


Epoch 1086: 272batch [00:38,  7.15batch/s, loss=1.54e+3]


epoch 1086: avg train loss 1515.60, bar train loss 3.395, len train loss 0.035, col train loss 136.731


Epoch 1087: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1086: avg test  loss 1531.70, bar  test loss 3.453, len  test loss 0.034, col  test loss 138.654


Epoch 1087: 272batch [00:37,  7.17batch/s, loss=1.57e+3]


epoch 1087: avg train loss 1518.62, bar train loss 3.487, len train loss 0.035, col train loss 137.102


Epoch 1088: 1batch [00:00,  7.69batch/s, loss=1.54e+3]

epoch 1087: avg test  loss 1542.35, bar  test loss 3.986, len  test loss 0.036, col  test loss 137.864


Epoch 1088: 272batch [00:37,  7.17batch/s, loss=1.54e+3]


epoch 1088: avg train loss 1523.19, bar train loss 3.467, len train loss 0.033, col train loss 137.113


Epoch 1089: 1batch [00:00,  8.40batch/s, loss=1.6e+3]

epoch 1088: avg test  loss 1538.77, bar  test loss 3.464, len  test loss 0.037, col  test loss 138.282


Epoch 1089: 272batch [00:37,  7.20batch/s, loss=1.5e+3] 


epoch 1089: avg train loss 1520.88, bar train loss 3.372, len train loss 0.035, col train loss 137.234


Epoch 1090: 1batch [00:00,  7.46batch/s, loss=1.54e+3]

epoch 1089: avg test  loss 1544.41, bar  test loss 4.115, len  test loss 0.037, col  test loss 138.895


Epoch 1090: 272batch [00:37,  7.17batch/s, loss=1.59e+3]


epoch 1090: avg train loss 1524.41, bar train loss 3.326, len train loss 0.036, col train loss 137.753
epoch 1090: avg test  loss 1535.02, bar  test loss 3.562, len  test loss 0.037, col  test loss 138.261


Epoch 1091: 272batch [00:37,  7.18batch/s, loss=1.58e+3]


epoch 1091: avg train loss 1521.65, bar train loss 3.288, len train loss 0.034, col train loss 137.364


Epoch 1092: 1batch [00:00,  8.20batch/s, loss=1.53e+3]

epoch 1091: avg test  loss 1540.39, bar  test loss 3.393, len  test loss 0.037, col  test loss 139.374


Epoch 1092: 272batch [00:39,  6.97batch/s, loss=1.63e+3]


epoch 1092: avg train loss 1522.26, bar train loss 3.394, len train loss 0.034, col train loss 137.449


Epoch 1093: 1batch [00:00,  6.62batch/s, loss=1.48e+3]

epoch 1092: avg test  loss 1534.89, bar  test loss 3.401, len  test loss 0.035, col  test loss 137.832


Epoch 1093: 272batch [00:42,  6.46batch/s, loss=1.54e+3]


epoch 1093: avg train loss 1519.14, bar train loss 3.267, len train loss 0.034, col train loss 137.030


Epoch 1094: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1093: avg test  loss 1529.75, bar  test loss 3.556, len  test loss 0.037, col  test loss 137.999


Epoch 1094: 272batch [00:40,  6.78batch/s, loss=1.61e+3]


epoch 1094: avg train loss 1521.08, bar train loss 3.454, len train loss 0.034, col train loss 137.284


Epoch 1095: 1batch [00:00,  7.63batch/s, loss=1.56e+3]

epoch 1094: avg test  loss 1543.78, bar  test loss 4.425, len  test loss 0.036, col  test loss 138.141


Epoch 1095: 272batch [00:39,  6.81batch/s, loss=1.53e+3]


epoch 1095: avg train loss 1520.23, bar train loss 3.451, len train loss 0.035, col train loss 137.119
epoch 1095: avg test  loss 1535.94, bar  test loss 3.677, len  test loss 0.037, col  test loss 138.618


Epoch 1096: 272batch [00:41,  6.49batch/s, loss=1.35e+3]


epoch 1096: avg train loss 1520.43, bar train loss 3.461, len train loss 0.035, col train loss 137.342


Epoch 1097: 1batch [00:00,  7.19batch/s, loss=1.49e+3]

epoch 1096: avg test  loss 1538.34, bar  test loss 3.624, len  test loss 0.037, col  test loss 137.955


Epoch 1097: 272batch [00:40,  6.72batch/s, loss=1.56e+3]


epoch 1097: avg train loss 1523.47, bar train loss 3.531, len train loss 0.035, col train loss 137.633


Epoch 1098: 1batch [00:00,  7.41batch/s, loss=1.46e+3]

epoch 1097: avg test  loss 1527.77, bar  test loss 3.241, len  test loss 0.038, col  test loss 138.254


Epoch 1098: 272batch [00:40,  6.73batch/s, loss=1.61e+3]


epoch 1098: avg train loss 1518.47, bar train loss 3.300, len train loss 0.036, col train loss 137.151


Epoch 1099: 1batch [00:00,  7.52batch/s, loss=1.51e+3]

epoch 1098: avg test  loss 1530.57, bar  test loss 3.507, len  test loss 0.039, col  test loss 138.018


Epoch 1099: 272batch [00:39,  6.80batch/s, loss=1.54e+3]


epoch 1099: avg train loss 1521.68, bar train loss 3.488, len train loss 0.037, col train loss 137.278


Epoch 1100: 1batch [00:00,  7.69batch/s, loss=1.57e+3]

epoch 1099: avg test  loss 1550.58, bar  test loss 3.843, len  test loss 0.042, col  test loss 139.646


Epoch 1100: 272batch [00:40,  6.67batch/s, loss=1.55e+3]


epoch 1100: avg train loss 1518.51, bar train loss 3.377, len train loss 0.035, col train loss 136.901
epoch 1100: avg test  loss 1536.39, bar  test loss 3.800, len  test loss 0.036, col  test loss 137.667


Epoch 1101: 272batch [00:42,  6.40batch/s, loss=1.59e+3]


epoch 1101: avg train loss 1521.39, bar train loss 3.370, len train loss 0.036, col train loss 137.209


Epoch 1102: 1batch [00:00,  6.99batch/s, loss=1.53e+3]

epoch 1101: avg test  loss 1534.10, bar  test loss 3.269, len  test loss 0.035, col  test loss 138.419


Epoch 1102: 272batch [00:40,  6.76batch/s, loss=1.47e+3]


epoch 1102: avg train loss 1522.85, bar train loss 3.426, len train loss 0.038, col train loss 137.495


Epoch 1103: 1batch [00:00,  7.63batch/s, loss=1.6e+3]

epoch 1102: avg test  loss 1541.83, bar  test loss 3.641, len  test loss 0.043, col  test loss 140.380


Epoch 1103: 272batch [00:40,  6.73batch/s, loss=1.87e+3]


epoch 1103: avg train loss 1522.92, bar train loss 3.340, len train loss 0.034, col train loss 137.658


Epoch 1104: 0batch [00:00, ?batch/s]

epoch 1103: avg test  loss 1538.48, bar  test loss 3.514, len  test loss 0.037, col  test loss 138.813


Epoch 1104: 272batch [00:40,  6.71batch/s, loss=1.44e+3]


epoch 1104: avg train loss 1520.11, bar train loss 3.427, len train loss 0.033, col train loss 137.461


Epoch 1105: 1batch [00:00,  7.58batch/s, loss=1.55e+3]

epoch 1104: avg test  loss 1536.63, bar  test loss 3.255, len  test loss 0.035, col  test loss 138.903


Epoch 1105: 272batch [00:40,  6.75batch/s, loss=1.58e+3]


epoch 1105: avg train loss 1521.36, bar train loss 3.403, len train loss 0.033, col train loss 137.344
epoch 1105: avg test  loss 1549.87, bar  test loss 4.703, len  test loss 0.035, col  test loss 138.955


Epoch 1106: 272batch [00:42,  6.42batch/s, loss=1.53e+3]


epoch 1106: avg train loss 1520.74, bar train loss 3.364, len train loss 0.033, col train loss 137.239


Epoch 1107: 1batch [00:00,  7.04batch/s, loss=1.54e+3]

epoch 1106: avg test  loss 1537.88, bar  test loss 3.706, len  test loss 0.035, col  test loss 138.885


Epoch 1107: 272batch [00:40,  6.75batch/s, loss=1.54e+3]


epoch 1107: avg train loss 1521.80, bar train loss 3.609, len train loss 0.034, col train loss 137.046


Epoch 1108: 0batch [00:00, ?batch/s]

epoch 1107: avg test  loss 1532.07, bar  test loss 3.446, len  test loss 0.032, col  test loss 138.634


Epoch 1108: 272batch [00:40,  6.75batch/s, loss=1.62e+3]


epoch 1108: avg train loss 1521.05, bar train loss 3.281, len train loss 0.034, col train loss 137.135


Epoch 1109: 1batch [00:00,  7.46batch/s, loss=1.55e+3]

epoch 1108: avg test  loss 1543.59, bar  test loss 3.946, len  test loss 0.038, col  test loss 138.894


Epoch 1109: 272batch [00:40,  6.77batch/s, loss=1.48e+3]


epoch 1109: avg train loss 1523.05, bar train loss 3.391, len train loss 0.035, col train loss 137.536


Epoch 1110: 1batch [00:00,  7.63batch/s, loss=1.59e+3]

epoch 1109: avg test  loss 1528.28, bar  test loss 3.321, len  test loss 0.035, col  test loss 137.705


Epoch 1110: 272batch [00:40,  6.69batch/s, loss=1.66e+3]


epoch 1110: avg train loss 1521.04, bar train loss 3.351, len train loss 0.035, col train loss 137.314
epoch 1110: avg test  loss 1539.34, bar  test loss 3.449, len  test loss 0.039, col  test loss 138.700


Epoch 1111: 272batch [00:42,  6.39batch/s, loss=1.4e+3] 


epoch 1111: avg train loss 1521.64, bar train loss 3.390, len train loss 0.036, col train loss 137.399


Epoch 1112: 1batch [00:00,  7.41batch/s, loss=1.56e+3]

epoch 1111: avg test  loss 1534.52, bar  test loss 3.546, len  test loss 0.037, col  test loss 137.874


Epoch 1112: 272batch [00:40,  6.73batch/s, loss=1.61e+3]


epoch 1112: avg train loss 1524.48, bar train loss 3.530, len train loss 0.035, col train loss 137.581


Epoch 1113: 1batch [00:00,  7.75batch/s, loss=1.48e+3]

epoch 1112: avg test  loss 1534.14, bar  test loss 3.360, len  test loss 0.034, col  test loss 138.985


Epoch 1113: 272batch [00:40,  6.76batch/s, loss=1.61e+3]


epoch 1113: avg train loss 1522.90, bar train loss 3.612, len train loss 0.034, col train loss 137.219


Epoch 1114: 1batch [00:00,  7.41batch/s, loss=1.54e+3]

epoch 1113: avg test  loss 1531.30, bar  test loss 3.529, len  test loss 0.038, col  test loss 138.121


Epoch 1114: 272batch [00:40,  6.72batch/s, loss=1.46e+3]


epoch 1114: avg train loss 1517.55, bar train loss 3.331, len train loss 0.035, col train loss 137.076


Epoch 1115: 1batch [00:00,  7.75batch/s, loss=1.53e+3]

epoch 1114: avg test  loss 1540.87, bar  test loss 4.136, len  test loss 0.036, col  test loss 138.071


Epoch 1115: 272batch [00:40,  6.73batch/s, loss=1.54e+3]


epoch 1115: avg train loss 1524.16, bar train loss 3.519, len train loss 0.036, col train loss 137.639
epoch 1115: avg test  loss 1541.91, bar  test loss 3.800, len  test loss 0.051, col  test loss 139.920


Epoch 1116: 272batch [00:43,  6.31batch/s, loss=1.55e+3]


epoch 1116: avg train loss 1518.71, bar train loss 3.351, len train loss 0.036, col train loss 137.138


Epoch 1117: 1batch [00:00,  7.69batch/s, loss=1.47e+3]

epoch 1116: avg test  loss 1541.44, bar  test loss 3.783, len  test loss 0.036, col  test loss 138.915


Epoch 1117: 272batch [00:40,  6.70batch/s, loss=1.56e+3]


epoch 1117: avg train loss 1525.05, bar train loss 3.456, len train loss 0.036, col train loss 137.804


Epoch 1118: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1117: avg test  loss 1548.61, bar  test loss 4.097, len  test loss 0.038, col  test loss 139.608


Epoch 1118: 272batch [00:40,  6.72batch/s, loss=1.49e+3]


epoch 1118: avg train loss 1528.46, bar train loss 3.410, len train loss 0.037, col train loss 137.956


Epoch 1119: 1batch [00:00,  7.87batch/s, loss=1.52e+3]

epoch 1118: avg test  loss 1537.08, bar  test loss 3.454, len  test loss 0.037, col  test loss 138.313


Epoch 1119: 272batch [00:40,  6.74batch/s, loss=1.58e+3]


epoch 1119: avg train loss 1520.56, bar train loss 3.311, len train loss 0.035, col train loss 137.254


Epoch 1120: 0batch [00:00, ?batch/s]

epoch 1119: avg test  loss 1538.52, bar  test loss 3.721, len  test loss 0.035, col  test loss 139.158


Epoch 1120: 272batch [00:40,  6.70batch/s, loss=1.59e+3]


epoch 1120: avg train loss 1528.79, bar train loss 3.440, len train loss 0.034, col train loss 138.207
epoch 1120: avg test  loss 1545.67, bar  test loss 3.782, len  test loss 0.035, col  test loss 139.931


Epoch 1121: 272batch [00:42,  6.35batch/s, loss=1.49e+3]


epoch 1121: avg train loss 1526.74, bar train loss 3.404, len train loss 0.033, col train loss 137.779


Epoch 1122: 1batch [00:00,  8.00batch/s, loss=1.5e+3]

epoch 1121: avg test  loss 1538.30, bar  test loss 3.658, len  test loss 0.035, col  test loss 138.600


Epoch 1122: 272batch [00:40,  6.68batch/s, loss=1.45e+3]


epoch 1122: avg train loss 1521.18, bar train loss 3.333, len train loss 0.034, col train loss 137.464


Epoch 1123: 1batch [00:00,  7.81batch/s, loss=1.48e+3]

epoch 1122: avg test  loss 1539.47, bar  test loss 3.676, len  test loss 0.038, col  test loss 138.930


Epoch 1123: 272batch [00:40,  6.68batch/s, loss=1.5e+3] 


epoch 1123: avg train loss 1525.67, bar train loss 3.525, len train loss 0.035, col train loss 138.051


Epoch 1124: 1batch [00:00,  6.54batch/s, loss=1.55e+3]

epoch 1123: avg test  loss 1537.53, bar  test loss 3.438, len  test loss 0.038, col  test loss 139.281


Epoch 1124: 272batch [00:40,  6.65batch/s, loss=1.57e+3]


epoch 1124: avg train loss 1524.90, bar train loss 3.399, len train loss 0.034, col train loss 137.763


Epoch 1125: 0batch [00:00, ?batch/s]

epoch 1124: avg test  loss 1557.18, bar  test loss 5.076, len  test loss 0.035, col  test loss 139.035


Epoch 1125: 272batch [00:41,  6.63batch/s, loss=1.6e+3] 


epoch 1125: avg train loss 1527.08, bar train loss 3.457, len train loss 0.035, col train loss 137.971
epoch 1125: avg test  loss 1543.91, bar  test loss 3.645, len  test loss 0.038, col  test loss 139.476


Epoch 1126: 272batch [00:43,  6.31batch/s, loss=1.48e+3]


epoch 1126: avg train loss 1526.17, bar train loss 3.463, len train loss 0.036, col train loss 137.976


Epoch 1127: 1batch [00:00,  7.14batch/s, loss=1.56e+3]

epoch 1126: avg test  loss 1555.50, bar  test loss 5.649, len  test loss 0.039, col  test loss 139.337


Epoch 1127: 272batch [00:40,  6.67batch/s, loss=1.53e+3]


epoch 1127: avg train loss 1526.76, bar train loss 3.634, len train loss 0.035, col train loss 138.057


Epoch 1128: 1batch [00:00,  8.47batch/s, loss=1.52e+3]

epoch 1127: avg test  loss 1541.09, bar  test loss 4.365, len  test loss 0.038, col  test loss 138.979


Epoch 1128: 272batch [00:40,  6.69batch/s, loss=1.47e+3]


epoch 1128: avg train loss 1520.73, bar train loss 3.334, len train loss 0.035, col train loss 137.368


Epoch 1129: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1128: avg test  loss 1537.26, bar  test loss 4.341, len  test loss 0.036, col  test loss 138.313


Epoch 1129: 272batch [00:40,  6.67batch/s, loss=1.48e+3]


epoch 1129: avg train loss 1521.87, bar train loss 3.524, len train loss 0.034, col train loss 137.473


Epoch 1130: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1129: avg test  loss 1540.65, bar  test loss 3.566, len  test loss 0.038, col  test loss 140.002


Epoch 1130: 272batch [00:40,  6.66batch/s, loss=1.48e+3]


epoch 1130: avg train loss 1524.22, bar train loss 3.339, len train loss 0.033, col train loss 137.513
epoch 1130: avg test  loss 1542.55, bar  test loss 3.354, len  test loss 0.040, col  test loss 140.286


Epoch 1131: 272batch [00:42,  6.36batch/s, loss=1.63e+3]


epoch 1131: avg train loss 1524.89, bar train loss 3.460, len train loss 0.035, col train loss 137.478


Epoch 1132: 1batch [00:00,  8.07batch/s, loss=1.57e+3]

epoch 1131: avg test  loss 1536.01, bar  test loss 3.754, len  test loss 0.036, col  test loss 138.343


Epoch 1132: 272batch [00:40,  6.66batch/s, loss=1.57e+3]


epoch 1132: avg train loss 1524.21, bar train loss 3.305, len train loss 0.034, col train loss 137.964


Epoch 1133: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 1132: avg test  loss 1535.71, bar  test loss 3.645, len  test loss 0.035, col  test loss 138.555


Epoch 1133: 272batch [00:41,  6.63batch/s, loss=1.45e+3]


epoch 1133: avg train loss 1524.86, bar train loss 3.358, len train loss 0.035, col train loss 137.584


Epoch 1134: 1batch [00:00,  7.81batch/s, loss=1.55e+3]

epoch 1133: avg test  loss 1575.51, bar  test loss 6.284, len  test loss 0.044, col  test loss 139.214


Epoch 1134: 272batch [00:40,  6.68batch/s, loss=1.69e+3]


epoch 1134: avg train loss 1528.30, bar train loss 3.413, len train loss 0.035, col train loss 137.989


Epoch 1135: 1batch [00:00,  8.20batch/s, loss=1.56e+3]

epoch 1134: avg test  loss 1546.77, bar  test loss 3.727, len  test loss 0.044, col  test loss 139.781


Epoch 1135: 272batch [00:41,  6.63batch/s, loss=1.72e+3]


epoch 1135: avg train loss 1528.22, bar train loss 3.499, len train loss 0.034, col train loss 137.910
epoch 1135: avg test  loss 1592.61, bar  test loss 8.118, len  test loss 0.039, col  test loss 140.841


Epoch 1136: 272batch [00:42,  6.33batch/s, loss=1.46e+3]


epoch 1136: avg train loss 1530.83, bar train loss 3.637, len train loss 0.038, col train loss 138.277


Epoch 1137: 1batch [00:00,  7.63batch/s, loss=1.48e+3]

epoch 1136: avg test  loss 1539.82, bar  test loss 3.348, len  test loss 0.035, col  test loss 138.338


Epoch 1137: 272batch [00:40,  6.67batch/s, loss=1.58e+3]


epoch 1137: avg train loss 1527.27, bar train loss 3.436, len train loss 0.036, col train loss 137.706


Epoch 1138: 1batch [00:00,  7.35batch/s, loss=1.53e+3]

epoch 1137: avg test  loss 1550.43, bar  test loss 4.433, len  test loss 0.038, col  test loss 138.904


Epoch 1138: 272batch [00:40,  6.65batch/s, loss=1.75e+3]


epoch 1138: avg train loss 1523.09, bar train loss 3.515, len train loss 0.036, col train loss 137.494


Epoch 1139: 1batch [00:00,  7.94batch/s, loss=1.56e+3]

epoch 1138: avg test  loss 1540.32, bar  test loss 3.587, len  test loss 0.047, col  test loss 139.271


Epoch 1139: 272batch [00:41,  6.62batch/s, loss=1.52e+3]


epoch 1139: avg train loss 1524.54, bar train loss 3.335, len train loss 0.033, col train loss 137.451


Epoch 1140: 1batch [00:00,  7.58batch/s, loss=1.47e+3]

epoch 1139: avg test  loss 1534.59, bar  test loss 3.395, len  test loss 0.035, col  test loss 138.837


Epoch 1140: 272batch [00:40,  6.64batch/s, loss=1.63e+3]


epoch 1140: avg train loss 1525.65, bar train loss 3.430, len train loss 0.035, col train loss 137.960
epoch 1140: avg test  loss 1544.92, bar  test loss 4.109, len  test loss 0.041, col  test loss 139.382


Epoch 1141: 272batch [00:43,  6.32batch/s, loss=1.69e+3]


epoch 1141: avg train loss 1530.90, bar train loss 3.497, len train loss 0.036, col train loss 138.175


Epoch 1142: 1batch [00:00,  7.63batch/s, loss=1.51e+3]

epoch 1141: avg test  loss 1546.89, bar  test loss 3.774, len  test loss 0.050, col  test loss 140.348


Epoch 1142: 272batch [00:40,  6.64batch/s, loss=1.65e+3]


epoch 1142: avg train loss 1527.53, bar train loss 3.344, len train loss 0.037, col train loss 138.134


Epoch 1143: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1142: avg test  loss 1548.02, bar  test loss 3.648, len  test loss 0.036, col  test loss 139.606


Epoch 1143: 272batch [00:41,  6.61batch/s, loss=1.48e+3]


epoch 1143: avg train loss 1528.93, bar train loss 3.477, len train loss 0.035, col train loss 138.063


Epoch 1144: 1batch [00:00,  6.49batch/s, loss=1.5e+3]

epoch 1143: avg test  loss 1549.93, bar  test loss 3.933, len  test loss 0.037, col  test loss 140.129


Epoch 1144: 272batch [00:41,  6.61batch/s, loss=1.5e+3] 


epoch 1144: avg train loss 1527.92, bar train loss 3.548, len train loss 0.037, col train loss 137.762


Epoch 1145: 1batch [00:00,  8.07batch/s, loss=1.52e+3]

epoch 1144: avg test  loss 1550.16, bar  test loss 3.569, len  test loss 0.044, col  test loss 140.182


Epoch 1145: 272batch [00:41,  6.58batch/s, loss=1.53e+3]


epoch 1145: avg train loss 1529.41, bar train loss 3.473, len train loss 0.037, col train loss 137.908
epoch 1145: avg test  loss 1553.07, bar  test loss 4.101, len  test loss 0.042, col  test loss 140.392


Epoch 1146: 272batch [00:43,  6.27batch/s, loss=1.63e+3]


epoch 1146: avg train loss 1527.84, bar train loss 3.394, len train loss 0.035, col train loss 138.052


Epoch 1147: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1146: avg test  loss 1537.21, bar  test loss 3.826, len  test loss 0.034, col  test loss 138.521


Epoch 1147: 272batch [00:40,  6.65batch/s, loss=1.52e+3]


epoch 1147: avg train loss 1528.63, bar train loss 3.527, len train loss 0.034, col train loss 137.989


Epoch 1148: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1147: avg test  loss 1537.22, bar  test loss 3.404, len  test loss 0.035, col  test loss 138.812


Epoch 1148: 272batch [00:40,  6.67batch/s, loss=1.38e+3]


epoch 1148: avg train loss 1527.71, bar train loss 3.513, len train loss 0.035, col train loss 138.046


Epoch 1149: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1148: avg test  loss 1538.42, bar  test loss 3.786, len  test loss 0.038, col  test loss 138.992


Epoch 1149: 272batch [00:41,  6.58batch/s, loss=1.43e+3]


epoch 1149: avg train loss 1527.88, bar train loss 3.504, len train loss 0.036, col train loss 138.154


Epoch 1150: 0batch [00:00, ?batch/s, loss=1.47e+3]

epoch 1149: avg test  loss 1549.58, bar  test loss 3.919, len  test loss 0.051, col  test loss 139.606


Epoch 1150: 272batch [00:41,  6.59batch/s, loss=1.52e+3]


epoch 1150: avg train loss 1531.74, bar train loss 3.556, len train loss 0.038, col train loss 138.366
epoch 1150: avg test  loss 1541.03, bar  test loss 3.397, len  test loss 0.038, col  test loss 139.652


Epoch 1151: 272batch [00:42,  6.34batch/s, loss=1.66e+3]


epoch 1151: avg train loss 1532.65, bar train loss 3.473, len train loss 0.037, col train loss 138.542


Epoch 1152: 1batch [00:00,  7.52batch/s, loss=1.51e+3]

epoch 1151: avg test  loss 1548.86, bar  test loss 3.662, len  test loss 0.037, col  test loss 139.377


Epoch 1152: 272batch [00:41,  6.61batch/s, loss=1.61e+3]


epoch 1152: avg train loss 1531.01, bar train loss 3.489, len train loss 0.037, col train loss 137.875


Epoch 1153: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1152: avg test  loss 1557.41, bar  test loss 5.266, len  test loss 0.036, col  test loss 139.237


Epoch 1153: 272batch [00:41,  6.62batch/s, loss=1.38e+3]


epoch 1153: avg train loss 1531.68, bar train loss 3.482, len train loss 0.035, col train loss 138.810


Epoch 1154: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1153: avg test  loss 1560.80, bar  test loss 5.686, len  test loss 0.034, col  test loss 139.330


Epoch 1154: 272batch [00:41,  6.61batch/s, loss=1.54e+3]


epoch 1154: avg train loss 1529.13, bar train loss 3.479, len train loss 0.034, col train loss 137.762


Epoch 1155: 1batch [00:00,  7.63batch/s, loss=1.55e+3]

epoch 1154: avg test  loss 1546.70, bar  test loss 3.494, len  test loss 0.039, col  test loss 139.426


Epoch 1155: 272batch [00:41,  6.61batch/s, loss=1.49e+3]


epoch 1155: avg train loss 1526.80, bar train loss 3.352, len train loss 0.033, col train loss 137.863
epoch 1155: avg test  loss 1539.34, bar  test loss 3.550, len  test loss 0.039, col  test loss 139.638


Epoch 1156: 272batch [00:44,  6.16batch/s, loss=1.54e+3]


epoch 1156: avg train loss 1532.79, bar train loss 3.648, len train loss 0.036, col train loss 138.280


Epoch 1157: 1batch [00:00,  7.58batch/s, loss=1.52e+3]

epoch 1156: avg test  loss 1560.11, bar  test loss 4.812, len  test loss 0.037, col  test loss 139.488


Epoch 1157: 272batch [00:41,  6.61batch/s, loss=1.58e+3]


epoch 1157: avg train loss 1531.59, bar train loss 3.407, len train loss 0.036, col train loss 138.244


Epoch 1158: 1batch [00:00,  7.41batch/s, loss=1.58e+3]

epoch 1157: avg test  loss 1548.49, bar  test loss 3.576, len  test loss 0.038, col  test loss 140.072


Epoch 1158: 272batch [00:41,  6.63batch/s, loss=1.49e+3]


epoch 1158: avg train loss 1530.24, bar train loss 3.408, len train loss 0.035, col train loss 138.082


Epoch 1159: 1batch [00:00,  7.63batch/s, loss=1.57e+3]

epoch 1158: avg test  loss 1547.55, bar  test loss 3.443, len  test loss 0.037, col  test loss 140.058


Epoch 1159: 272batch [00:41,  6.62batch/s, loss=1.43e+3]


epoch 1159: avg train loss 1535.49, bar train loss 3.635, len train loss 0.036, col train loss 138.549


Epoch 1160: 1batch [00:00,  7.75batch/s, loss=1.63e+3]

epoch 1159: avg test  loss 1554.72, bar  test loss 3.686, len  test loss 0.044, col  test loss 140.599


Epoch 1160: 272batch [00:40,  6.65batch/s, loss=1.62e+3]


epoch 1160: avg train loss 1530.18, bar train loss 3.471, len train loss 0.035, col train loss 138.074
epoch 1160: avg test  loss 1545.15, bar  test loss 3.582, len  test loss 0.035, col  test loss 140.104


Epoch 1161: 272batch [00:43,  6.23batch/s, loss=1.55e+3]


epoch 1161: avg train loss 1530.02, bar train loss 3.468, len train loss 0.034, col train loss 138.005


Epoch 1162: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1161: avg test  loss 1537.22, bar  test loss 3.579, len  test loss 0.036, col  test loss 138.906


Epoch 1162: 272batch [00:41,  6.57batch/s, loss=1.54e+3]


epoch 1162: avg train loss 1528.51, bar train loss 3.444, len train loss 0.035, col train loss 138.111


Epoch 1163: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1162: avg test  loss 1546.85, bar  test loss 3.703, len  test loss 0.036, col  test loss 140.046


Epoch 1163: 272batch [00:41,  6.58batch/s, loss=1.51e+3]


epoch 1163: avg train loss 1530.89, bar train loss 3.616, len train loss 0.034, col train loss 138.029


Epoch 1164: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1163: avg test  loss 1546.13, bar  test loss 3.860, len  test loss 0.038, col  test loss 140.123


Epoch 1164: 272batch [00:41,  6.56batch/s, loss=1.55e+3]


epoch 1164: avg train loss 1532.37, bar train loss 3.549, len train loss 0.035, col train loss 138.156


Epoch 1165: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1164: avg test  loss 1544.46, bar  test loss 3.678, len  test loss 0.035, col  test loss 139.249


Epoch 1165: 272batch [00:41,  6.58batch/s, loss=1.41e+3]


epoch 1165: avg train loss 1531.36, bar train loss 3.316, len train loss 0.034, col train loss 138.598
epoch 1165: avg test  loss 1542.34, bar  test loss 3.463, len  test loss 0.035, col  test loss 138.914


Epoch 1166: 272batch [00:43,  6.23batch/s, loss=1.52e+3]


epoch 1166: avg train loss 1530.21, bar train loss 3.486, len train loss 0.035, col train loss 138.476


Epoch 1167: 0batch [00:00, ?batch/s]

epoch 1166: avg test  loss 1543.21, bar  test loss 3.638, len  test loss 0.036, col  test loss 140.119


Epoch 1167: 272batch [00:41,  6.57batch/s, loss=1.44e+3]


epoch 1167: avg train loss 1530.72, bar train loss 3.406, len train loss 0.035, col train loss 138.682


Epoch 1168: 1batch [00:00,  7.19batch/s, loss=1.6e+3]

epoch 1167: avg test  loss 1548.39, bar  test loss 3.684, len  test loss 0.035, col  test loss 139.882


Epoch 1168: 272batch [00:41,  6.57batch/s, loss=1.51e+3]


epoch 1168: avg train loss 1533.53, bar train loss 3.552, len train loss 0.035, col train loss 138.436


Epoch 1169: 1batch [00:00,  7.63batch/s, loss=1.52e+3]

epoch 1168: avg test  loss 1568.16, bar  test loss 5.475, len  test loss 0.036, col  test loss 140.254


Epoch 1169: 272batch [00:41,  6.56batch/s, loss=1.65e+3]


epoch 1169: avg train loss 1533.49, bar train loss 3.467, len train loss 0.036, col train loss 138.810


Epoch 1170: 1batch [00:00,  7.52batch/s, loss=1.56e+3]

epoch 1169: avg test  loss 1550.62, bar  test loss 3.595, len  test loss 0.038, col  test loss 140.690


Epoch 1170: 272batch [00:41,  6.55batch/s, loss=1.5e+3] 


epoch 1170: avg train loss 1530.50, bar train loss 3.452, len train loss 0.035, col train loss 138.200
epoch 1170: avg test  loss 1586.44, bar  test loss 7.346, len  test loss 0.037, col  test loss 139.766


Epoch 1171: 272batch [00:44,  6.12batch/s, loss=1.6e+3] 


epoch 1171: avg train loss 1531.91, bar train loss 3.680, len train loss 0.034, col train loss 138.302


Epoch 1172: 1batch [00:00,  7.09batch/s, loss=1.53e+3]

epoch 1171: avg test  loss 1546.50, bar  test loss 3.218, len  test loss 0.036, col  test loss 139.695


Epoch 1172: 272batch [00:41,  6.54batch/s, loss=1.58e+3]


epoch 1172: avg train loss 1528.03, bar train loss 3.344, len train loss 0.034, col train loss 138.094


Epoch 1173: 1batch [00:00,  6.99batch/s, loss=1.54e+3]

epoch 1172: avg test  loss 1538.70, bar  test loss 3.741, len  test loss 0.038, col  test loss 139.251


Epoch 1173: 272batch [00:41,  6.57batch/s, loss=1.55e+3]


epoch 1173: avg train loss 1528.20, bar train loss 3.328, len train loss 0.034, col train loss 138.277


Epoch 1174: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1173: avg test  loss 1544.31, bar  test loss 3.244, len  test loss 0.036, col  test loss 139.705


Epoch 1174: 272batch [00:41,  6.48batch/s, loss=1.58e+3]


epoch 1174: avg train loss 1531.43, bar train loss 3.392, len train loss 0.039, col train loss 138.617


Epoch 1175: 1batch [00:00,  7.52batch/s, loss=1.57e+3]

epoch 1174: avg test  loss 1541.44, bar  test loss 3.954, len  test loss 0.037, col  test loss 139.570


Epoch 1175: 272batch [00:41,  6.58batch/s, loss=1.6e+3] 


epoch 1175: avg train loss 1531.54, bar train loss 3.607, len train loss 0.039, col train loss 138.579
epoch 1175: avg test  loss 1543.27, bar  test loss 3.580, len  test loss 0.039, col  test loss 139.991


Epoch 1176: 272batch [00:43,  6.19batch/s, loss=1.49e+3]


epoch 1176: avg train loss 1531.60, bar train loss 3.633, len train loss 0.033, col train loss 138.410


Epoch 1177: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1176: avg test  loss 1548.91, bar  test loss 4.426, len  test loss 0.035, col  test loss 138.691


Epoch 1177: 272batch [00:41,  6.52batch/s, loss=1.62e+3]


epoch 1177: avg train loss 1530.78, bar train loss 3.472, len train loss 0.035, col train loss 138.196


Epoch 1178: 1batch [00:00,  7.47batch/s, loss=1.55e+3]

epoch 1177: avg test  loss 1556.39, bar  test loss 4.050, len  test loss 0.039, col  test loss 140.599


Epoch 1178: 272batch [00:41,  6.58batch/s, loss=1.57e+3]


epoch 1178: avg train loss 1535.30, bar train loss 3.604, len train loss 0.036, col train loss 138.574


Epoch 1179: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1178: avg test  loss 1557.15, bar  test loss 4.979, len  test loss 0.033, col  test loss 139.336


Epoch 1179: 272batch [00:41,  6.51batch/s, loss=1.55e+3]


epoch 1179: avg train loss 1532.98, bar train loss 3.523, len train loss 0.036, col train loss 138.468


Epoch 1180: 1batch [00:00,  7.52batch/s, loss=1.54e+3]

epoch 1179: avg test  loss 1551.32, bar  test loss 4.069, len  test loss 0.040, col  test loss 139.525


Epoch 1180: 272batch [00:41,  6.53batch/s, loss=1.72e+3]


epoch 1180: avg train loss 1534.79, bar train loss 3.509, len train loss 0.035, col train loss 138.692
epoch 1180: avg test  loss 1577.65, bar  test loss 5.772, len  test loss 0.044, col  test loss 141.257


Epoch 1181: 272batch [00:44,  6.12batch/s, loss=1.59e+3]


epoch 1181: avg train loss 1534.26, bar train loss 3.581, len train loss 0.034, col train loss 138.624


Epoch 1182: 1batch [00:00,  7.30batch/s, loss=1.47e+3]

epoch 1181: avg test  loss 1540.86, bar  test loss 3.610, len  test loss 0.035, col  test loss 138.821


Epoch 1182: 272batch [00:41,  6.49batch/s, loss=1.47e+3]


epoch 1182: avg train loss 1536.51, bar train loss 3.855, len train loss 0.036, col train loss 138.647


Epoch 1183: 1batch [00:00,  6.94batch/s, loss=1.53e+3]

epoch 1182: avg test  loss 1559.59, bar  test loss 5.178, len  test loss 0.040, col  test loss 140.883


Epoch 1183: 272batch [00:41,  6.56batch/s, loss=1.61e+3]


epoch 1183: avg train loss 1533.29, bar train loss 3.515, len train loss 0.035, col train loss 138.605


Epoch 1184: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1183: avg test  loss 1539.69, bar  test loss 3.537, len  test loss 0.037, col  test loss 138.986


Epoch 1184: 272batch [00:41,  6.54batch/s, loss=1.63e+3]


epoch 1184: avg train loss 1527.31, bar train loss 3.332, len train loss 0.035, col train loss 138.375


Epoch 1185: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1184: avg test  loss 1541.42, bar  test loss 3.513, len  test loss 0.033, col  test loss 139.303


Epoch 1185: 272batch [00:41,  6.51batch/s, loss=1.65e+3]


epoch 1185: avg train loss 1534.41, bar train loss 3.546, len train loss 0.036, col train loss 138.631
epoch 1185: avg test  loss 1546.85, bar  test loss 3.821, len  test loss 0.038, col  test loss 139.655


Epoch 1186: 272batch [00:43,  6.18batch/s, loss=1.54e+3]


epoch 1186: avg train loss 1532.11, bar train loss 3.350, len train loss 0.035, col train loss 138.036


Epoch 1187: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1186: avg test  loss 1540.79, bar  test loss 3.497, len  test loss 0.039, col  test loss 139.392


Epoch 1187: 272batch [00:42,  6.47batch/s, loss=1.53e+3]


epoch 1187: avg train loss 1532.47, bar train loss 3.561, len train loss 0.035, col train loss 138.353


Epoch 1188: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1187: avg test  loss 1553.55, bar  test loss 4.430, len  test loss 0.034, col  test loss 139.636


Epoch 1188: 272batch [00:41,  6.48batch/s, loss=1.72e+3]


epoch 1188: avg train loss 1531.91, bar train loss 3.503, len train loss 0.034, col train loss 138.620


Epoch 1189: 0batch [00:00, ?batch/s, loss=1.73e+3]

epoch 1188: avg test  loss 1683.72, bar  test loss 17.614, len  test loss 0.034, col  test loss 139.176


Epoch 1189: 272batch [00:41,  6.52batch/s, loss=1.55e+3]


epoch 1189: avg train loss 1550.79, bar train loss 5.486, len train loss 0.035, col train loss 138.562


Epoch 1190: 1batch [00:00,  7.81batch/s, loss=1.6e+3]

epoch 1189: avg test  loss 1544.08, bar  test loss 3.516, len  test loss 0.037, col  test loss 140.163


Epoch 1190: 272batch [00:41,  6.51batch/s, loss=1.58e+3]


epoch 1190: avg train loss 1535.12, bar train loss 3.573, len train loss 0.037, col train loss 138.696
epoch 1190: avg test  loss 1551.37, bar  test loss 3.535, len  test loss 0.035, col  test loss 140.908


Epoch 1191: 272batch [00:45,  6.04batch/s, loss=1.54e+3]


epoch 1191: avg train loss 1534.74, bar train loss 3.704, len train loss 0.034, col train loss 138.690


Epoch 1192: 1batch [00:00,  6.76batch/s, loss=1.53e+3]

epoch 1191: avg test  loss 1551.96, bar  test loss 3.972, len  test loss 0.036, col  test loss 139.612


Epoch 1192: 272batch [00:41,  6.51batch/s, loss=1.47e+3]


epoch 1192: avg train loss 1535.05, bar train loss 3.469, len train loss 0.036, col train loss 138.568


Epoch 1193: 1batch [00:00,  7.41batch/s, loss=1.53e+3]

epoch 1192: avg test  loss 1553.81, bar  test loss 4.651, len  test loss 0.036, col  test loss 139.522


Epoch 1193: 272batch [00:41,  6.49batch/s, loss=1.63e+3]


epoch 1193: avg train loss 1537.92, bar train loss 3.759, len train loss 0.034, col train loss 138.747


Epoch 1194: 1batch [00:00,  7.14batch/s, loss=1.51e+3]

epoch 1193: avg test  loss 1545.84, bar  test loss 3.820, len  test loss 0.039, col  test loss 139.996


Epoch 1194: 272batch [00:41,  6.51batch/s, loss=1.52e+3]


epoch 1194: avg train loss 1537.31, bar train loss 3.625, len train loss 0.037, col train loss 139.027


Epoch 1195: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1194: avg test  loss 1555.63, bar  test loss 3.560, len  test loss 0.035, col  test loss 139.459


Epoch 1195: 272batch [00:42,  6.42batch/s, loss=1.49e+3]


epoch 1195: avg train loss 1534.77, bar train loss 3.411, len train loss 0.035, col train loss 138.788
epoch 1195: avg test  loss 1545.92, bar  test loss 3.471, len  test loss 0.038, col  test loss 140.195


Epoch 1196: 272batch [00:44,  6.11batch/s, loss=1.4e+3] 


epoch 1196: avg train loss 1534.78, bar train loss 3.509, len train loss 0.036, col train loss 138.698


Epoch 1197: 0batch [00:00, ?batch/s]

epoch 1196: avg test  loss 1551.07, bar  test loss 3.531, len  test loss 0.038, col  test loss 140.237


Epoch 1197: 272batch [00:42,  6.42batch/s, loss=1.59e+3]


epoch 1197: avg train loss 1536.28, bar train loss 3.451, len train loss 0.037, col train loss 138.889


Epoch 1198: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1197: avg test  loss 1546.36, bar  test loss 3.451, len  test loss 0.038, col  test loss 138.493


Epoch 1198: 272batch [00:42,  6.44batch/s, loss=1.61e+3]


epoch 1198: avg train loss 1536.41, bar train loss 3.652, len train loss 0.038, col train loss 138.722


Epoch 1199: 0batch [00:00, ?batch/s]

epoch 1198: avg test  loss 1557.49, bar  test loss 4.388, len  test loss 0.042, col  test loss 140.984


Epoch 1199: 272batch [00:42,  6.47batch/s, loss=1.46e+3]


epoch 1199: avg train loss 1532.21, bar train loss 3.538, len train loss 0.037, col train loss 138.772


Epoch 1200: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1199: avg test  loss 1545.04, bar  test loss 3.464, len  test loss 0.036, col  test loss 141.094


Epoch 1200: 272batch [00:42,  6.46batch/s, loss=1.5e+3] 


epoch 1200: avg train loss 1533.95, bar train loss 3.431, len train loss 0.036, col train loss 138.667
epoch 1200: avg test  loss 1546.86, bar  test loss 3.832, len  test loss 0.040, col  test loss 139.384


Epoch 1201: 272batch [00:45,  6.03batch/s, loss=1.44e+3]


epoch 1201: avg train loss 1534.74, bar train loss 3.589, len train loss 0.034, col train loss 138.675


Epoch 1202: 0batch [00:00, ?batch/s]

epoch 1201: avg test  loss 1548.99, bar  test loss 3.853, len  test loss 0.035, col  test loss 139.201


Epoch 1202: 272batch [00:42,  6.45batch/s, loss=1.63e+3]


epoch 1202: avg train loss 1536.40, bar train loss 3.476, len train loss 0.035, col train loss 139.161


Epoch 1203: 1batch [00:00,  6.99batch/s, loss=1.58e+3]

epoch 1202: avg test  loss 1549.82, bar  test loss 3.470, len  test loss 0.042, col  test loss 140.366


Epoch 1203: 272batch [00:42,  6.47batch/s, loss=1.6e+3] 


epoch 1203: avg train loss 1534.56, bar train loss 3.603, len train loss 0.033, col train loss 138.454


Epoch 1204: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1203: avg test  loss 1548.24, bar  test loss 3.593, len  test loss 0.036, col  test loss 138.996


Epoch 1204: 272batch [00:41,  6.49batch/s, loss=1.5e+3] 


epoch 1204: avg train loss 1533.23, bar train loss 3.413, len train loss 0.034, col train loss 138.643


Epoch 1205: 1batch [00:00,  7.30batch/s, loss=1.52e+3]

epoch 1204: avg test  loss 1547.16, bar  test loss 3.664, len  test loss 0.036, col  test loss 138.790


Epoch 1205: 272batch [00:42,  6.45batch/s, loss=1.43e+3]


epoch 1205: avg train loss 1534.28, bar train loss 3.746, len train loss 0.035, col train loss 138.212
epoch 1205: avg test  loss 1545.61, bar  test loss 3.582, len  test loss 0.038, col  test loss 139.611


Epoch 1206: 272batch [00:44,  6.05batch/s, loss=1.51e+3]


epoch 1206: avg train loss 1531.01, bar train loss 3.362, len train loss 0.035, col train loss 138.335


Epoch 1207: 0batch [00:00, ?batch/s]

epoch 1206: avg test  loss 1547.68, bar  test loss 3.372, len  test loss 0.035, col  test loss 139.840


Epoch 1207: 272batch [00:41,  6.50batch/s, loss=1.59e+3]


epoch 1207: avg train loss 1532.16, bar train loss 3.366, len train loss 0.035, col train loss 138.587


Epoch 1208: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1207: avg test  loss 1552.20, bar  test loss 3.654, len  test loss 0.035, col  test loss 139.903


Epoch 1208: 272batch [00:41,  6.49batch/s, loss=1.77e+3]


epoch 1208: avg train loss 1537.68, bar train loss 3.590, len train loss 0.035, col train loss 138.850


Epoch 1209: 0batch [00:00, ?batch/s]

epoch 1208: avg test  loss 1551.22, bar  test loss 3.747, len  test loss 0.047, col  test loss 139.662


Epoch 1209: 272batch [00:41,  6.52batch/s, loss=1.67e+3]


epoch 1209: avg train loss 1532.84, bar train loss 3.513, len train loss 0.035, col train loss 138.593


Epoch 1210: 0batch [00:00, ?batch/s]

epoch 1209: avg test  loss 1575.72, bar  test loss 6.096, len  test loss 0.036, col  test loss 139.741


Epoch 1210: 272batch [00:41,  6.51batch/s, loss=1.53e+3]


epoch 1210: avg train loss 1537.34, bar train loss 3.713, len train loss 0.037, col train loss 138.659
epoch 1210: avg test  loss 1558.30, bar  test loss 4.552, len  test loss 0.034, col  test loss 139.628


Epoch 1211: 272batch [00:44,  6.09batch/s, loss=1.44e+3]


epoch 1211: avg train loss 1541.08, bar train loss 3.680, len train loss 0.037, col train loss 139.283


Epoch 1212: 1batch [00:00,  8.20batch/s, loss=1.55e+3]

epoch 1211: avg test  loss 1592.00, bar  test loss 6.464, len  test loss 0.040, col  test loss 141.866


Epoch 1212: 272batch [00:42,  6.47batch/s, loss=1.58e+3]


epoch 1212: avg train loss 1539.02, bar train loss 3.692, len train loss 0.035, col train loss 138.774


Epoch 1213: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1212: avg test  loss 1561.08, bar  test loss 5.008, len  test loss 0.041, col  test loss 139.787


Epoch 1213: 272batch [00:41,  6.48batch/s, loss=1.58e+3]


epoch 1213: avg train loss 1538.42, bar train loss 3.481, len train loss 0.036, col train loss 139.130
epoch 1213: avg test  loss 1560.37, bar  test loss 3.938, len  test loss 0.042, col  test loss 141.637


Epoch 1214: 272batch [00:42,  6.45batch/s, loss=1.62e+3]


epoch 1214: avg train loss 1538.13, bar train loss 3.603, len train loss 0.035, col train loss 138.987


Epoch 1215: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1214: avg test  loss 1555.84, bar  test loss 3.789, len  test loss 0.034, col  test loss 139.467


Epoch 1215: 272batch [00:42,  6.45batch/s, loss=1.63e+3]


epoch 1215: avg train loss 1539.61, bar train loss 3.654, len train loss 0.037, col train loss 139.275
epoch 1215: avg test  loss 1558.93, bar  test loss 4.114, len  test loss 0.044, col  test loss 141.334


Epoch 1216: 272batch [00:44,  6.09batch/s, loss=1.6e+3] 


epoch 1216: avg train loss 1538.27, bar train loss 3.599, len train loss 0.035, col train loss 139.018


Epoch 1217: 0batch [00:00, ?batch/s]

epoch 1216: avg test  loss 1559.97, bar  test loss 5.015, len  test loss 0.037, col  test loss 140.052


Epoch 1217: 272batch [00:42,  6.37batch/s, loss=1.51e+3]


epoch 1217: avg train loss 1537.43, bar train loss 3.507, len train loss 0.036, col train loss 138.999


Epoch 1218: 1batch [00:00,  7.81batch/s, loss=1.59e+3]

epoch 1217: avg test  loss 1564.28, bar  test loss 4.910, len  test loss 0.036, col  test loss 141.182


Epoch 1218: 272batch [00:41,  6.49batch/s, loss=1.65e+3]


epoch 1218: avg train loss 1534.71, bar train loss 3.439, len train loss 0.036, col train loss 138.773


Epoch 1219: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1218: avg test  loss 1552.10, bar  test loss 3.894, len  test loss 0.037, col  test loss 139.639


Epoch 1219: 272batch [00:42,  6.44batch/s, loss=1.43e+3]


epoch 1219: avg train loss 1538.41, bar train loss 3.577, len train loss 0.035, col train loss 138.770


Epoch 1220: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1219: avg test  loss 1546.50, bar  test loss 3.388, len  test loss 0.038, col  test loss 140.069


Epoch 1220: 272batch [00:42,  6.46batch/s, loss=1.47e+3]


epoch 1220: avg train loss 1534.54, bar train loss 3.441, len train loss 0.036, col train loss 138.361
epoch 1220: avg test  loss 1559.66, bar  test loss 3.574, len  test loss 0.037, col  test loss 141.167


Epoch 1221: 272batch [00:44,  6.07batch/s, loss=1.52e+3]


epoch 1221: avg train loss 1536.78, bar train loss 3.481, len train loss 0.035, col train loss 138.847


Epoch 1222: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1221: avg test  loss 1558.73, bar  test loss 4.721, len  test loss 0.037, col  test loss 139.836


Epoch 1222: 272batch [00:42,  6.46batch/s, loss=1.52e+3]


epoch 1222: avg train loss 1545.35, bar train loss 3.685, len train loss 0.036, col train loss 139.446


Epoch 1223: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1222: avg test  loss 1555.67, bar  test loss 3.525, len  test loss 0.038, col  test loss 140.907


Epoch 1223: 272batch [00:42,  6.45batch/s, loss=1.53e+3]


epoch 1223: avg train loss 1540.19, bar train loss 3.530, len train loss 0.036, col train loss 139.397


Epoch 1224: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1223: avg test  loss 1552.84, bar  test loss 4.018, len  test loss 0.039, col  test loss 139.749


Epoch 1224: 272batch [00:42,  6.44batch/s, loss=1.53e+3]


epoch 1224: avg train loss 1536.59, bar train loss 3.529, len train loss 0.036, col train loss 138.667


Epoch 1225: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1224: avg test  loss 1555.26, bar  test loss 3.969, len  test loss 0.039, col  test loss 140.725


Epoch 1225: 272batch [00:43,  6.30batch/s, loss=1.57e+3]


epoch 1225: avg train loss 1541.27, bar train loss 3.542, len train loss 0.035, col train loss 139.499
epoch 1225: avg test  loss 1547.47, bar  test loss 3.579, len  test loss 0.037, col  test loss 141.055


Epoch 1226: 272batch [00:44,  6.08batch/s, loss=1.58e+3]


epoch 1226: avg train loss 1537.94, bar train loss 3.615, len train loss 0.036, col train loss 139.106


Epoch 1227: 1batch [00:00,  7.04batch/s, loss=1.58e+3]

epoch 1226: avg test  loss 1557.94, bar  test loss 4.245, len  test loss 0.039, col  test loss 140.395


Epoch 1227: 272batch [00:42,  6.46batch/s, loss=1.63e+3]


epoch 1227: avg train loss 1539.40, bar train loss 3.448, len train loss 0.036, col train loss 139.420


Epoch 1228: 1batch [00:00,  7.46batch/s, loss=1.59e+3]

epoch 1227: avg test  loss 1551.18, bar  test loss 3.578, len  test loss 0.036, col  test loss 140.633


Epoch 1228: 272batch [00:42,  6.43batch/s, loss=1.59e+3]


epoch 1228: avg train loss 1537.38, bar train loss 3.609, len train loss 0.036, col train loss 139.073


Epoch 1229: 0batch [00:00, ?batch/s, loss=1.61e+3]

epoch 1228: avg test  loss 1554.54, bar  test loss 3.711, len  test loss 0.037, col  test loss 140.596


Epoch 1229: 272batch [00:42,  6.40batch/s, loss=1.5e+3] 


epoch 1229: avg train loss 1538.77, bar train loss 3.468, len train loss 0.036, col train loss 139.221


Epoch 1230: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1229: avg test  loss 1548.36, bar  test loss 3.478, len  test loss 0.040, col  test loss 140.579


Epoch 1230: 272batch [00:41,  6.50batch/s, loss=1.65e+3]


epoch 1230: avg train loss 1538.07, bar train loss 3.423, len train loss 0.036, col train loss 138.889
epoch 1230: avg test  loss 1557.17, bar  test loss 4.238, len  test loss 0.037, col  test loss 139.838


Epoch 1231: 272batch [00:46,  5.85batch/s, loss=1.48e+3]


epoch 1231: avg train loss 1540.07, bar train loss 3.627, len train loss 0.038, col train loss 138.770


Epoch 1232: 1batch [00:00,  7.04batch/s, loss=1.51e+3]

epoch 1231: avg test  loss 1579.36, bar  test loss 5.726, len  test loss 0.042, col  test loss 139.405


Epoch 1232: 272batch [00:43,  6.23batch/s, loss=1.5e+3] 


epoch 1232: avg train loss 1538.31, bar train loss 3.813, len train loss 0.035, col train loss 138.873


Epoch 1233: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1232: avg test  loss 1551.01, bar  test loss 3.852, len  test loss 0.037, col  test loss 139.715


Epoch 1233: 272batch [00:43,  6.29batch/s, loss=1.54e+3]


epoch 1233: avg train loss 1539.23, bar train loss 3.601, len train loss 0.036, col train loss 138.928


Epoch 1234: 0batch [00:00, ?batch/s]

epoch 1233: avg test  loss 1559.53, bar  test loss 4.229, len  test loss 0.036, col  test loss 140.368


Epoch 1234: 272batch [00:43,  6.18batch/s, loss=1.52e+3]


epoch 1234: avg train loss 1538.24, bar train loss 3.592, len train loss 0.036, col train loss 139.173


Epoch 1235: 0batch [00:00, ?batch/s]

epoch 1234: avg test  loss 1549.49, bar  test loss 3.931, len  test loss 0.034, col  test loss 140.568


Epoch 1235: 272batch [00:42,  6.36batch/s, loss=1.62e+3]


epoch 1235: avg train loss 1538.32, bar train loss 3.654, len train loss 0.036, col train loss 138.939
epoch 1235: avg test  loss 1554.56, bar  test loss 3.726, len  test loss 0.038, col  test loss 139.583


Epoch 1236: 272batch [00:45,  6.03batch/s, loss=1.52e+3]


epoch 1236: avg train loss 1538.91, bar train loss 3.506, len train loss 0.035, col train loss 139.456


Epoch 1237: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1236: avg test  loss 1555.07, bar  test loss 3.580, len  test loss 0.038, col  test loss 140.838


Epoch 1237: 272batch [00:42,  6.37batch/s, loss=1.46e+3]


epoch 1237: avg train loss 1542.70, bar train loss 3.502, len train loss 0.036, col train loss 139.213


Epoch 1238: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1237: avg test  loss 1562.53, bar  test loss 3.712, len  test loss 0.044, col  test loss 139.974


Epoch 1238: 272batch [00:41,  6.58batch/s, loss=1.55e+3]


epoch 1238: avg train loss 1541.11, bar train loss 3.596, len train loss 0.036, col train loss 139.232


Epoch 1239: 0batch [00:00, ?batch/s]

epoch 1238: avg test  loss 1546.12, bar  test loss 3.458, len  test loss 0.036, col  test loss 140.023


Epoch 1239: 272batch [00:42,  6.45batch/s, loss=1.55e+3]


epoch 1239: avg train loss 1537.19, bar train loss 3.501, len train loss 0.034, col train loss 139.271


Epoch 1240: 1batch [00:00,  7.94batch/s, loss=1.52e+3]

epoch 1239: avg test  loss 1559.32, bar  test loss 4.322, len  test loss 0.038, col  test loss 141.197


Epoch 1240: 272batch [00:41,  6.56batch/s, loss=1.4e+3] 


epoch 1240: avg train loss 1538.12, bar train loss 3.629, len train loss 0.036, col train loss 138.821
epoch 1240: avg test  loss 1543.97, bar  test loss 3.639, len  test loss 0.042, col  test loss 139.118


Epoch 1241: 272batch [00:41,  6.58batch/s, loss=1.45e+3]


epoch 1241: avg train loss 1541.15, bar train loss 3.709, len train loss 0.038, col train loss 139.542


Epoch 1242: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1241: avg test  loss 1554.17, bar  test loss 3.525, len  test loss 0.037, col  test loss 140.286


Epoch 1242: 272batch [00:41,  6.61batch/s, loss=1.56e+3]


epoch 1242: avg train loss 1541.48, bar train loss 3.592, len train loss 0.034, col train loss 139.460


Epoch 1243: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1242: avg test  loss 1549.28, bar  test loss 3.399, len  test loss 0.037, col  test loss 140.598


Epoch 1243: 272batch [00:41,  6.59batch/s, loss=1.5e+3] 


epoch 1243: avg train loss 1537.09, bar train loss 3.362, len train loss 0.035, col train loss 139.146


Epoch 1244: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1243: avg test  loss 1543.44, bar  test loss 3.376, len  test loss 0.036, col  test loss 139.771


Epoch 1244: 272batch [00:41,  6.61batch/s, loss=1.42e+3]


epoch 1244: avg train loss 1539.00, bar train loss 3.557, len train loss 0.035, col train loss 139.442


Epoch 1245: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 1244: avg test  loss 1556.97, bar  test loss 4.215, len  test loss 0.040, col  test loss 140.738


Epoch 1245: 272batch [00:41,  6.61batch/s, loss=1.61e+3]


epoch 1245: avg train loss 1540.52, bar train loss 3.582, len train loss 0.038, col train loss 139.019
epoch 1245: avg test  loss 1578.24, bar  test loss 6.254, len  test loss 0.036, col  test loss 139.863


Epoch 1246: 272batch [00:41,  6.58batch/s, loss=1.53e+3]


epoch 1246: avg train loss 1541.45, bar train loss 3.571, len train loss 0.036, col train loss 139.663


Epoch 1247: 0batch [00:00, ?batch/s]

epoch 1246: avg test  loss 1598.04, bar  test loss 7.565, len  test loss 0.037, col  test loss 140.581


Epoch 1247: 272batch [00:42,  6.46batch/s, loss=1.52e+3]


epoch 1247: avg train loss 1541.90, bar train loss 3.800, len train loss 0.035, col train loss 139.348


Epoch 1248: 0batch [00:00, ?batch/s]

epoch 1247: avg test  loss 1551.18, bar  test loss 3.750, len  test loss 0.038, col  test loss 140.229


Epoch 1248: 272batch [00:42,  6.37batch/s, loss=1.61e+3]


epoch 1248: avg train loss 1543.83, bar train loss 3.966, len train loss 0.037, col train loss 139.419


Epoch 1249: 1batch [00:00,  6.89batch/s, loss=1.49e+3]

epoch 1248: avg test  loss 1553.99, bar  test loss 3.609, len  test loss 0.036, col  test loss 140.383


Epoch 1249: 272batch [00:41,  6.49batch/s, loss=1.67e+3]


epoch 1249: avg train loss 1536.46, bar train loss 3.419, len train loss 0.035, col train loss 139.195


Epoch 1250: 1batch [00:00,  7.09batch/s, loss=1.56e+3]

epoch 1249: avg test  loss 1550.47, bar  test loss 3.849, len  test loss 0.038, col  test loss 140.574


Epoch 1250: 272batch [00:41,  6.51batch/s, loss=1.58e+3]


epoch 1250: avg train loss 1540.58, bar train loss 3.616, len train loss 0.035, col train loss 139.656
epoch 1250: avg test  loss 1549.51, bar  test loss 3.497, len  test loss 0.035, col  test loss 139.829


Epoch 1251: 272batch [00:41,  6.57batch/s, loss=1.54e+3]


epoch 1251: avg train loss 1535.64, bar train loss 3.557, len train loss 0.035, col train loss 139.082


Epoch 1252: 1batch [00:00,  6.62batch/s, loss=1.56e+3]

epoch 1251: avg test  loss 1550.98, bar  test loss 3.821, len  test loss 0.036, col  test loss 140.362


Epoch 1252: 272batch [00:41,  6.59batch/s, loss=1.58e+3]


epoch 1252: avg train loss 1541.99, bar train loss 3.520, len train loss 0.036, col train loss 139.523


Epoch 1253: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1252: avg test  loss 1559.82, bar  test loss 4.593, len  test loss 0.037, col  test loss 139.665


Epoch 1253: 272batch [00:41,  6.61batch/s, loss=1.59e+3]


epoch 1253: avg train loss 1541.49, bar train loss 3.552, len train loss 0.035, col train loss 139.289


Epoch 1254: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1253: avg test  loss 1553.93, bar  test loss 3.883, len  test loss 0.037, col  test loss 140.141


Epoch 1254: 272batch [00:41,  6.59batch/s, loss=1.58e+3]


epoch 1254: avg train loss 1549.79, bar train loss 3.675, len train loss 0.037, col train loss 140.121


Epoch 1255: 1batch [00:00,  6.67batch/s, loss=1.62e+3]

epoch 1254: avg test  loss 1564.17, bar  test loss 4.475, len  test loss 0.035, col  test loss 141.358


Epoch 1255: 272batch [00:41,  6.57batch/s, loss=1.6e+3] 


epoch 1255: avg train loss 1542.07, bar train loss 3.689, len train loss 0.036, col train loss 139.108
epoch 1255: avg test  loss 1557.66, bar  test loss 3.864, len  test loss 0.040, col  test loss 140.683


Epoch 1256: 272batch [00:41,  6.49batch/s, loss=1.44e+3]


epoch 1256: avg train loss 1540.74, bar train loss 3.558, len train loss 0.038, col train loss 139.213


Epoch 1257: 1batch [00:00,  7.25batch/s, loss=1.52e+3]

epoch 1256: avg test  loss 1550.69, bar  test loss 3.477, len  test loss 0.039, col  test loss 141.057


Epoch 1257: 272batch [00:41,  6.52batch/s, loss=1.57e+3]


epoch 1257: avg train loss 1539.52, bar train loss 3.388, len train loss 0.034, col train loss 139.535


Epoch 1258: 0batch [00:00, ?batch/s]

epoch 1257: avg test  loss 1550.63, bar  test loss 3.677, len  test loss 0.036, col  test loss 140.277


Epoch 1258: 272batch [00:41,  6.54batch/s, loss=1.48e+3]


epoch 1258: avg train loss 1537.01, bar train loss 3.564, len train loss 0.035, col train loss 139.231


Epoch 1259: 1batch [00:00,  7.52batch/s, loss=1.55e+3]

epoch 1258: avg test  loss 1549.78, bar  test loss 3.718, len  test loss 0.035, col  test loss 140.400


Epoch 1259: 272batch [00:41,  6.59batch/s, loss=1.62e+3]


epoch 1259: avg train loss 1542.12, bar train loss 3.640, len train loss 0.035, col train loss 139.355


Epoch 1260: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1259: avg test  loss 1553.90, bar  test loss 3.578, len  test loss 0.037, col  test loss 140.624


Epoch 1260: 272batch [00:41,  6.56batch/s, loss=1.48e+3]


epoch 1260: avg train loss 1541.81, bar train loss 3.520, len train loss 0.035, col train loss 139.177
epoch 1260: avg test  loss 1573.85, bar  test loss 5.050, len  test loss 0.039, col  test loss 141.565


Epoch 1261: 272batch [00:41,  6.56batch/s, loss=1.53e+3]


epoch 1261: avg train loss 1540.24, bar train loss 3.562, len train loss 0.037, col train loss 139.725


Epoch 1262: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1261: avg test  loss 1547.96, bar  test loss 3.769, len  test loss 0.037, col  test loss 140.254


Epoch 1262: 272batch [00:41,  6.54batch/s, loss=1.47e+3]


epoch 1262: avg train loss 1539.57, bar train loss 3.548, len train loss 0.036, col train loss 139.747


Epoch 1263: 0batch [00:00, ?batch/s]

epoch 1262: avg test  loss 1562.12, bar  test loss 4.124, len  test loss 0.037, col  test loss 141.883


Epoch 1263: 272batch [00:42,  6.46batch/s, loss=1.59e+3]


epoch 1263: avg train loss 1540.20, bar train loss 3.545, len train loss 0.035, col train loss 139.484


Epoch 1264: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1263: avg test  loss 1555.64, bar  test loss 3.671, len  test loss 0.040, col  test loss 140.794


Epoch 1264: 272batch [00:41,  6.54batch/s, loss=1.43e+3]


epoch 1264: avg train loss 1542.11, bar train loss 3.544, len train loss 0.037, col train loss 139.711


Epoch 1265: 1batch [00:00,  7.25batch/s, loss=1.59e+3]

epoch 1264: avg test  loss 1561.84, bar  test loss 3.609, len  test loss 0.042, col  test loss 141.577


Epoch 1265: 272batch [00:41,  6.57batch/s, loss=1.6e+3] 


epoch 1265: avg train loss 1542.35, bar train loss 3.416, len train loss 0.035, col train loss 139.660
epoch 1265: avg test  loss 1569.02, bar  test loss 4.745, len  test loss 0.039, col  test loss 140.963


Epoch 1266: 272batch [00:42,  6.47batch/s, loss=1.45e+3]


epoch 1266: avg train loss 1546.64, bar train loss 3.758, len train loss 0.038, col train loss 140.254


Epoch 1267: 1batch [00:00,  7.30batch/s, loss=1.58e+3]

epoch 1266: avg test  loss 1554.24, bar  test loss 3.691, len  test loss 0.041, col  test loss 140.832


Epoch 1267: 272batch [00:41,  6.57batch/s, loss=1.38e+3]


epoch 1267: avg train loss 1544.87, bar train loss 3.778, len train loss 0.038, col train loss 139.599


Epoch 1268: 1batch [00:00,  7.94batch/s, loss=1.54e+3]

epoch 1267: avg test  loss 1559.07, bar  test loss 3.746, len  test loss 0.047, col  test loss 141.243


Epoch 1268: 272batch [00:41,  6.49batch/s, loss=1.73e+3]


epoch 1268: avg train loss 1546.44, bar train loss 3.576, len train loss 0.038, col train loss 139.736


Epoch 1269: 0batch [00:00, ?batch/s, loss=1.61e+3]

epoch 1268: avg test  loss 1560.86, bar  test loss 3.837, len  test loss 0.038, col  test loss 141.663


Epoch 1269: 272batch [00:42,  6.46batch/s, loss=1.64e+3]


epoch 1269: avg train loss 1546.94, bar train loss 3.752, len train loss 0.037, col train loss 140.029


Epoch 1270: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1269: avg test  loss 1565.34, bar  test loss 4.094, len  test loss 0.049, col  test loss 142.380


Epoch 1270: 272batch [00:41,  6.53batch/s, loss=1.62e+3]


epoch 1270: avg train loss 1546.27, bar train loss 3.581, len train loss 0.036, col train loss 139.872
epoch 1270: avg test  loss 1554.22, bar  test loss 3.738, len  test loss 0.034, col  test loss 139.747


Epoch 1271: 272batch [00:41,  6.50batch/s, loss=1.56e+3]


epoch 1271: avg train loss 1543.80, bar train loss 3.543, len train loss 0.034, col train loss 139.687


Epoch 1272: 1batch [00:00,  7.69batch/s, loss=1.52e+3]

epoch 1271: avg test  loss 1560.71, bar  test loss 3.705, len  test loss 0.036, col  test loss 141.220


Epoch 1272: 272batch [00:41,  6.51batch/s, loss=1.71e+3]


epoch 1272: avg train loss 1546.30, bar train loss 3.651, len train loss 0.036, col train loss 139.962


Epoch 1273: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1272: avg test  loss 1553.15, bar  test loss 3.832, len  test loss 0.037, col  test loss 141.143


Epoch 1273: 272batch [00:42,  6.42batch/s, loss=1.48e+3]


epoch 1273: avg train loss 1544.61, bar train loss 3.625, len train loss 0.037, col train loss 140.155


Epoch 1274: 0batch [00:00, ?batch/s]

epoch 1273: avg test  loss 1572.58, bar  test loss 4.092, len  test loss 0.043, col  test loss 142.215


Epoch 1274: 272batch [00:43,  6.23batch/s, loss=1.49e+3]


epoch 1274: avg train loss 1546.95, bar train loss 3.643, len train loss 0.035, col train loss 139.766


Epoch 1275: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1274: avg test  loss 1555.80, bar  test loss 3.540, len  test loss 0.033, col  test loss 140.111


Epoch 1275: 272batch [00:43,  6.27batch/s, loss=1.72e+3]


epoch 1275: avg train loss 1543.02, bar train loss 3.511, len train loss 0.034, col train loss 139.944
epoch 1275: avg test  loss 1554.28, bar  test loss 3.777, len  test loss 0.037, col  test loss 141.643


Epoch 1276: 272batch [00:42,  6.34batch/s, loss=1.52e+3]


epoch 1276: avg train loss 1546.49, bar train loss 3.645, len train loss 0.035, col train loss 140.135


Epoch 1277: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1276: avg test  loss 1567.37, bar  test loss 4.760, len  test loss 0.036, col  test loss 140.503


Epoch 1277: 272batch [00:42,  6.41batch/s, loss=1.49e+3]


epoch 1277: avg train loss 1547.22, bar train loss 3.790, len train loss 0.035, col train loss 139.777


Epoch 1278: 1batch [00:00,  6.85batch/s, loss=1.52e+3]

epoch 1277: avg test  loss 1562.02, bar  test loss 3.500, len  test loss 0.034, col  test loss 141.489


Epoch 1278: 272batch [00:42,  6.40batch/s, loss=1.57e+3]


epoch 1278: avg train loss 1547.42, bar train loss 3.718, len train loss 0.036, col train loss 139.842


Epoch 1279: 0batch [00:00, ?batch/s]

epoch 1278: avg test  loss 1573.98, bar  test loss 5.423, len  test loss 0.034, col  test loss 140.712


Epoch 1279: 272batch [00:42,  6.40batch/s, loss=1.55e+3]


epoch 1279: avg train loss 1543.81, bar train loss 3.580, len train loss 0.034, col train loss 139.786


Epoch 1280: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1279: avg test  loss 1567.07, bar  test loss 4.134, len  test loss 0.041, col  test loss 141.974


Epoch 1280: 272batch [00:42,  6.43batch/s, loss=1.43e+3]


epoch 1280: avg train loss 1545.46, bar train loss 3.656, len train loss 0.036, col train loss 139.647
epoch 1280: avg test  loss 1563.23, bar  test loss 3.553, len  test loss 0.038, col  test loss 141.398


Epoch 1281: 272batch [00:41,  6.50batch/s, loss=1.52e+3]


epoch 1281: avg train loss 1543.65, bar train loss 3.498, len train loss 0.037, col train loss 139.721


Epoch 1282: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1281: avg test  loss 1562.61, bar  test loss 3.721, len  test loss 0.038, col  test loss 141.773


Epoch 1282: 272batch [00:42,  6.35batch/s, loss=1.73e+3]


epoch 1282: avg train loss 1553.16, bar train loss 4.058, len train loss 0.037, col train loss 140.264


Epoch 1283: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1282: avg test  loss 1581.31, bar  test loss 6.058, len  test loss 0.041, col  test loss 141.537


Epoch 1283: 272batch [00:42,  6.41batch/s, loss=1.54e+3]


epoch 1283: avg train loss 1547.01, bar train loss 3.641, len train loss 0.037, col train loss 140.218


Epoch 1284: 0batch [00:00, ?batch/s]

epoch 1283: avg test  loss 1563.08, bar  test loss 4.005, len  test loss 0.037, col  test loss 141.387


Epoch 1284: 272batch [00:43,  6.29batch/s, loss=1.48e+3]


epoch 1284: avg train loss 1547.04, bar train loss 3.671, len train loss 0.035, col train loss 139.957


Epoch 1285: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1284: avg test  loss 1560.49, bar  test loss 4.019, len  test loss 0.039, col  test loss 141.022


Epoch 1285: 272batch [00:41,  6.48batch/s, loss=1.58e+3]


epoch 1285: avg train loss 1546.65, bar train loss 3.710, len train loss 0.039, col train loss 139.931
epoch 1285: avg test  loss 1584.89, bar  test loss 5.765, len  test loss 0.050, col  test loss 142.342


Epoch 1286: 272batch [00:42,  6.46batch/s, loss=1.67e+3]


epoch 1286: avg train loss 1548.57, bar train loss 3.586, len train loss 0.038, col train loss 139.985


Epoch 1287: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1286: avg test  loss 1576.42, bar  test loss 4.407, len  test loss 0.038, col  test loss 141.912


Epoch 1287: 272batch [00:42,  6.46batch/s, loss=1.47e+3]


epoch 1287: avg train loss 1542.25, bar train loss 3.685, len train loss 0.034, col train loss 139.552


Epoch 1288: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1287: avg test  loss 1554.62, bar  test loss 3.530, len  test loss 0.037, col  test loss 141.009


Epoch 1288: 272batch [00:41,  6.48batch/s, loss=1.62e+3]


epoch 1288: avg train loss 1545.95, bar train loss 3.516, len train loss 0.035, col train loss 139.948


Epoch 1289: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1288: avg test  loss 1566.83, bar  test loss 3.665, len  test loss 0.047, col  test loss 141.579


Epoch 1289: 272batch [00:42,  6.47batch/s, loss=1.61e+3]


epoch 1289: avg train loss 1546.43, bar train loss 3.575, len train loss 0.036, col train loss 139.982


Epoch 1290: 1batch [00:00,  7.25batch/s, loss=1.59e+3]

epoch 1289: avg test  loss 1574.60, bar  test loss 5.457, len  test loss 0.037, col  test loss 141.111


Epoch 1290: 272batch [00:42,  6.43batch/s, loss=1.46e+3]


epoch 1290: avg train loss 1543.98, bar train loss 3.606, len train loss 0.035, col train loss 139.698
epoch 1290: avg test  loss 1561.10, bar  test loss 3.968, len  test loss 0.039, col  test loss 140.892


Epoch 1291: 272batch [00:42,  6.38batch/s, loss=1.46e+3]


epoch 1291: avg train loss 1543.39, bar train loss 3.560, len train loss 0.035, col train loss 139.761


Epoch 1292: 0batch [00:00, ?batch/s]

epoch 1291: avg test  loss 1561.10, bar  test loss 4.052, len  test loss 0.043, col  test loss 140.512


Epoch 1292: 272batch [00:42,  6.42batch/s, loss=1.54e+3]


epoch 1292: avg train loss 1547.64, bar train loss 3.752, len train loss 0.037, col train loss 140.086


Epoch 1293: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1292: avg test  loss 1569.37, bar  test loss 4.166, len  test loss 0.036, col  test loss 141.790


Epoch 1293: 272batch [00:42,  6.45batch/s, loss=1.6e+3] 


epoch 1293: avg train loss 1548.82, bar train loss 3.700, len train loss 0.037, col train loss 140.332


Epoch 1294: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1293: avg test  loss 1569.32, bar  test loss 4.198, len  test loss 0.047, col  test loss 142.664


Epoch 1294: 272batch [00:42,  6.44batch/s, loss=1.6e+3] 


epoch 1294: avg train loss 1548.49, bar train loss 3.748, len train loss 0.036, col train loss 140.145


Epoch 1295: 0batch [00:00, ?batch/s]

epoch 1294: avg test  loss 1591.06, bar  test loss 6.753, len  test loss 0.036, col  test loss 140.583


Epoch 1295: 272batch [00:42,  6.46batch/s, loss=1.51e+3]


epoch 1295: avg train loss 1547.45, bar train loss 3.728, len train loss 0.036, col train loss 139.981
epoch 1295: avg test  loss 1576.35, bar  test loss 5.116, len  test loss 0.036, col  test loss 141.359


Epoch 1296: 272batch [00:42,  6.41batch/s, loss=1.57e+3]


epoch 1296: avg train loss 1553.57, bar train loss 4.085, len train loss 0.037, col train loss 140.360


Epoch 1297: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1296: avg test  loss 1558.98, bar  test loss 3.643, len  test loss 0.037, col  test loss 141.029


Epoch 1297: 272batch [00:42,  6.37batch/s, loss=1.55e+3]


epoch 1297: avg train loss 1550.06, bar train loss 3.551, len train loss 0.035, col train loss 140.717


Epoch 1298: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1297: avg test  loss 1564.63, bar  test loss 3.746, len  test loss 0.039, col  test loss 141.866


Epoch 1298: 272batch [00:42,  6.40batch/s, loss=1.61e+3]


epoch 1298: avg train loss 1547.58, bar train loss 3.573, len train loss 0.036, col train loss 140.312


Epoch 1299: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1298: avg test  loss 1561.34, bar  test loss 4.317, len  test loss 0.039, col  test loss 140.466


Epoch 1299: 272batch [00:42,  6.39batch/s, loss=1.5e+3] 


epoch 1299: avg train loss 1545.59, bar train loss 3.881, len train loss 0.037, col train loss 139.542


Epoch 1300: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1299: avg test  loss 1559.02, bar  test loss 3.898, len  test loss 0.037, col  test loss 140.623


Epoch 1300: 272batch [00:42,  6.45batch/s, loss=1.55e+3]


epoch 1300: avg train loss 1549.48, bar train loss 3.714, len train loss 0.037, col train loss 140.505
epoch 1300: avg test  loss 1579.63, bar  test loss 5.069, len  test loss 0.037, col  test loss 142.092


Epoch 1301: 272batch [00:42,  6.38batch/s, loss=1.53e+3]


epoch 1301: avg train loss 1545.96, bar train loss 3.706, len train loss 0.036, col train loss 139.988


Epoch 1302: 1batch [00:00,  6.85batch/s, loss=1.57e+3]

epoch 1301: avg test  loss 1556.49, bar  test loss 3.586, len  test loss 0.042, col  test loss 141.197


Epoch 1302: 272batch [00:42,  6.44batch/s, loss=1.47e+3]


epoch 1302: avg train loss 1549.88, bar train loss 3.670, len train loss 0.038, col train loss 140.152


Epoch 1303: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1302: avg test  loss 1559.06, bar  test loss 3.850, len  test loss 0.038, col  test loss 140.937


Epoch 1303: 272batch [00:42,  6.43batch/s, loss=1.49e+3]


epoch 1303: avg train loss 1544.64, bar train loss 3.606, len train loss 0.035, col train loss 139.803


Epoch 1304: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1303: avg test  loss 1555.84, bar  test loss 3.563, len  test loss 0.039, col  test loss 140.779


Epoch 1304: 272batch [00:42,  6.34batch/s, loss=1.56e+3]


epoch 1304: avg train loss 1545.42, bar train loss 3.839, len train loss 0.036, col train loss 139.854


Epoch 1305: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1304: avg test  loss 1558.08, bar  test loss 3.587, len  test loss 0.038, col  test loss 140.631


Epoch 1305: 272batch [00:42,  6.38batch/s, loss=1.57e+3]


epoch 1305: avg train loss 1544.16, bar train loss 3.563, len train loss 0.037, col train loss 139.629
epoch 1305: avg test  loss 1567.92, bar  test loss 4.052, len  test loss 0.043, col  test loss 141.548


Epoch 1306: 272batch [00:42,  6.44batch/s, loss=1.73e+3]


epoch 1306: avg train loss 1550.08, bar train loss 3.675, len train loss 0.038, col train loss 140.212


Epoch 1307: 1batch [00:00,  7.35batch/s, loss=1.51e+3]

epoch 1306: avg test  loss 1569.89, bar  test loss 4.743, len  test loss 0.037, col  test loss 141.278


Epoch 1307: 272batch [00:42,  6.42batch/s, loss=1.5e+3] 


epoch 1307: avg train loss 1544.39, bar train loss 3.684, len train loss 0.037, col train loss 139.701


Epoch 1308: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1307: avg test  loss 1556.01, bar  test loss 3.713, len  test loss 0.044, col  test loss 139.750


Epoch 1308: 272batch [00:42,  6.41batch/s, loss=1.54e+3]


epoch 1308: avg train loss 1548.66, bar train loss 3.581, len train loss 0.038, col train loss 140.095


Epoch 1309: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1308: avg test  loss 1569.82, bar  test loss 3.927, len  test loss 0.040, col  test loss 142.249


Epoch 1309: 272batch [00:43,  6.32batch/s, loss=1.47e+3]


epoch 1309: avg train loss 1554.30, bar train loss 3.812, len train loss 0.039, col train loss 140.433


Epoch 1310: 1batch [00:00,  7.41batch/s, loss=1.61e+3]

epoch 1309: avg test  loss 1589.73, bar  test loss 5.588, len  test loss 0.057, col  test loss 143.144


Epoch 1310: 272batch [00:42,  6.35batch/s, loss=1.47e+3]


epoch 1310: avg train loss 1546.57, bar train loss 3.512, len train loss 0.036, col train loss 140.295
epoch 1310: avg test  loss 1557.54, bar  test loss 3.626, len  test loss 0.035, col  test loss 141.493


Epoch 1311: 272batch [00:42,  6.41batch/s, loss=1.58e+3]


epoch 1311: avg train loss 1553.55, bar train loss 3.748, len train loss 0.035, col train loss 140.392


Epoch 1312: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1311: avg test  loss 1563.17, bar  test loss 3.859, len  test loss 0.040, col  test loss 141.096


Epoch 1312: 272batch [00:42,  6.43batch/s, loss=1.53e+3]


epoch 1312: avg train loss 1546.65, bar train loss 3.537, len train loss 0.036, col train loss 139.967


Epoch 1313: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1312: avg test  loss 1560.01, bar  test loss 3.693, len  test loss 0.039, col  test loss 142.350


Epoch 1313: 272batch [00:42,  6.39batch/s, loss=1.48e+3]


epoch 1313: avg train loss 1549.01, bar train loss 3.623, len train loss 0.037, col train loss 140.634


Epoch 1314: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1313: avg test  loss 1558.32, bar  test loss 3.707, len  test loss 0.040, col  test loss 141.516


Epoch 1314: 272batch [00:42,  6.39batch/s, loss=1.65e+3]


epoch 1314: avg train loss 1550.32, bar train loss 3.717, len train loss 0.034, col train loss 140.589


Epoch 1315: 1batch [00:00,  8.06batch/s, loss=1.52e+3]

epoch 1314: avg test  loss 1566.48, bar  test loss 3.865, len  test loss 0.035, col  test loss 141.059


Epoch 1315: 272batch [00:42,  6.40batch/s, loss=1.62e+3]


epoch 1315: avg train loss 1550.51, bar train loss 3.728, len train loss 0.035, col train loss 140.296
epoch 1315: avg test  loss 1555.28, bar  test loss 3.487, len  test loss 0.037, col  test loss 140.697


Epoch 1316: 272batch [00:44,  6.13batch/s, loss=1.52e+3]


epoch 1316: avg train loss 1546.70, bar train loss 3.670, len train loss 0.037, col train loss 140.347


Epoch 1317: 1batch [00:00,  7.52batch/s, loss=1.49e+3]

epoch 1316: avg test  loss 1555.53, bar  test loss 3.566, len  test loss 0.034, col  test loss 141.685


Epoch 1317: 272batch [00:42,  6.36batch/s, loss=1.65e+3]


epoch 1317: avg train loss 1547.17, bar train loss 3.705, len train loss 0.037, col train loss 140.115


Epoch 1318: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1317: avg test  loss 1565.10, bar  test loss 3.812, len  test loss 0.035, col  test loss 141.449


Epoch 1318: 272batch [00:42,  6.42batch/s, loss=1.55e+3]


epoch 1318: avg train loss 1550.59, bar train loss 3.755, len train loss 0.035, col train loss 140.209


Epoch 1319: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1318: avg test  loss 1564.57, bar  test loss 4.197, len  test loss 0.039, col  test loss 140.817


Epoch 1319: 272batch [00:42,  6.40batch/s, loss=1.43e+3]


epoch 1319: avg train loss 1550.54, bar train loss 3.616, len train loss 0.037, col train loss 140.765


Epoch 1320: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1319: avg test  loss 1563.30, bar  test loss 3.895, len  test loss 0.037, col  test loss 140.826


Epoch 1320: 272batch [00:42,  6.43batch/s, loss=1.54e+3]


epoch 1320: avg train loss 1551.08, bar train loss 3.741, len train loss 0.036, col train loss 140.400
epoch 1320: avg test  loss 1561.30, bar  test loss 3.784, len  test loss 0.038, col  test loss 141.906


Epoch 1321: 272batch [00:42,  6.37batch/s, loss=1.63e+3]


epoch 1321: avg train loss 1548.48, bar train loss 3.629, len train loss 0.036, col train loss 140.357


Epoch 1322: 1batch [00:00,  7.04batch/s, loss=1.54e+3]

epoch 1321: avg test  loss 1556.42, bar  test loss 3.643, len  test loss 0.039, col  test loss 142.211


Epoch 1322: 272batch [00:43,  6.32batch/s, loss=1.66e+3]


epoch 1322: avg train loss 1549.68, bar train loss 3.580, len train loss 0.036, col train loss 140.286


Epoch 1323: 0batch [00:00, ?batch/s, loss=1.66e+3]

epoch 1322: avg test  loss 1562.99, bar  test loss 4.069, len  test loss 0.036, col  test loss 140.835


Epoch 1323: 272batch [00:43,  6.28batch/s, loss=1.44e+3]


epoch 1323: avg train loss 1546.98, bar train loss 3.638, len train loss 0.035, col train loss 140.086


Epoch 1324: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1323: avg test  loss 1558.27, bar  test loss 3.605, len  test loss 0.035, col  test loss 141.032


Epoch 1324: 272batch [00:42,  6.43batch/s, loss=1.67e+3]


epoch 1324: avg train loss 1550.92, bar train loss 3.720, len train loss 0.035, col train loss 140.386


Epoch 1325: 0batch [00:00, ?batch/s, loss=1.61e+3]

epoch 1324: avg test  loss 1562.54, bar  test loss 3.912, len  test loss 0.036, col  test loss 141.755


Epoch 1325: 272batch [00:42,  6.41batch/s, loss=1.52e+3]


epoch 1325: avg train loss 1549.76, bar train loss 3.697, len train loss 0.037, col train loss 140.004
epoch 1325: avg test  loss 1566.37, bar  test loss 4.662, len  test loss 0.038, col  test loss 140.519


Epoch 1326: 272batch [00:42,  6.38batch/s, loss=1.64e+3]


epoch 1326: avg train loss 1549.25, bar train loss 3.789, len train loss 0.035, col train loss 139.990


Epoch 1327: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1326: avg test  loss 1568.39, bar  test loss 4.351, len  test loss 0.038, col  test loss 141.146


Epoch 1327: 272batch [00:42,  6.38batch/s, loss=1.57e+3]


epoch 1327: avg train loss 1546.29, bar train loss 3.559, len train loss 0.037, col train loss 139.931


Epoch 1328: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1327: avg test  loss 1562.94, bar  test loss 3.979, len  test loss 0.040, col  test loss 140.762


Epoch 1328: 272batch [00:42,  6.39batch/s, loss=1.61e+3]


epoch 1328: avg train loss 1544.89, bar train loss 3.591, len train loss 0.038, col train loss 140.010


Epoch 1329: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1328: avg test  loss 1565.63, bar  test loss 4.274, len  test loss 0.041, col  test loss 142.154


Epoch 1329: 272batch [00:43,  6.22batch/s, loss=1.6e+3] 


epoch 1329: avg train loss 1550.60, bar train loss 3.858, len train loss 0.038, col train loss 140.257


Epoch 1330: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1329: avg test  loss 1564.59, bar  test loss 4.346, len  test loss 0.035, col  test loss 141.713


Epoch 1330: 272batch [00:43,  6.25batch/s, loss=1.45e+3]


epoch 1330: avg train loss 1550.90, bar train loss 3.621, len train loss 0.037, col train loss 140.548
epoch 1330: avg test  loss 1564.58, bar  test loss 3.939, len  test loss 0.038, col  test loss 141.601


Epoch 1331: 272batch [00:42,  6.38batch/s, loss=1.42e+3]


epoch 1331: avg train loss 1552.94, bar train loss 3.688, len train loss 0.036, col train loss 140.333


Epoch 1332: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1331: avg test  loss 1567.11, bar  test loss 3.808, len  test loss 0.035, col  test loss 141.538


Epoch 1332: 272batch [00:42,  6.38batch/s, loss=1.55e+3]


epoch 1332: avg train loss 1557.04, bar train loss 3.991, len train loss 0.034, col train loss 140.528


Epoch 1333: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1332: avg test  loss 1558.67, bar  test loss 3.535, len  test loss 0.033, col  test loss 140.692


Epoch 1333: 272batch [00:42,  6.36batch/s, loss=1.56e+3]


epoch 1333: avg train loss 1552.63, bar train loss 3.672, len train loss 0.035, col train loss 140.669


Epoch 1334: 1batch [00:00,  6.94batch/s, loss=1.48e+3]

epoch 1333: avg test  loss 1558.88, bar  test loss 3.816, len  test loss 0.039, col  test loss 141.397


Epoch 1334: 272batch [00:42,  6.38batch/s, loss=1.5e+3] 


epoch 1334: avg train loss 1552.57, bar train loss 3.646, len train loss 0.038, col train loss 141.030


Epoch 1335: 1batch [00:00,  7.25batch/s, loss=1.59e+3]

epoch 1334: avg test  loss 1563.99, bar  test loss 3.708, len  test loss 0.035, col  test loss 141.761


Epoch 1335: 272batch [00:42,  6.35batch/s, loss=1.52e+3]


epoch 1335: avg train loss 1552.51, bar train loss 3.812, len train loss 0.037, col train loss 140.603
epoch 1335: avg test  loss 1564.99, bar  test loss 3.706, len  test loss 0.038, col  test loss 141.046


Epoch 1336: 272batch [00:43,  6.32batch/s, loss=1.59e+3]


epoch 1336: avg train loss 1551.11, bar train loss 3.648, len train loss 0.035, col train loss 140.672


Epoch 1337: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1336: avg test  loss 1575.48, bar  test loss 4.319, len  test loss 0.044, col  test loss 142.005


Epoch 1337: 272batch [00:43,  6.23batch/s, loss=1.36e+3]


epoch 1337: avg train loss 1558.24, bar train loss 3.950, len train loss 0.038, col train loss 141.228


Epoch 1338: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1337: avg test  loss 1578.20, bar  test loss 4.859, len  test loss 0.046, col  test loss 141.424


Epoch 1338: 272batch [00:43,  6.30batch/s, loss=1.54e+3]


epoch 1338: avg train loss 1560.16, bar train loss 4.445, len train loss 0.036, col train loss 140.590


Epoch 1339: 1batch [00:00,  7.75batch/s, loss=1.57e+3]

epoch 1338: avg test  loss 1578.06, bar  test loss 5.536, len  test loss 0.038, col  test loss 140.729


Epoch 1339: 272batch [00:43,  6.32batch/s, loss=1.41e+3]


epoch 1339: avg train loss 1548.97, bar train loss 3.584, len train loss 0.036, col train loss 139.987


Epoch 1340: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1339: avg test  loss 1559.19, bar  test loss 3.535, len  test loss 0.036, col  test loss 141.313


Epoch 1340: 272batch [00:43,  6.31batch/s, loss=1.57e+3]


epoch 1340: avg train loss 1552.97, bar train loss 3.726, len train loss 0.036, col train loss 140.626
epoch 1340: avg test  loss 1613.27, bar  test loss 7.602, len  test loss 0.041, col  test loss 142.607


Epoch 1341: 272batch [00:43,  6.32batch/s, loss=1.61e+3]


epoch 1341: avg train loss 1553.11, bar train loss 3.683, len train loss 0.037, col train loss 140.588


Epoch 1342: 0batch [00:00, ?batch/s, loss=1.66e+3]

epoch 1341: avg test  loss 1564.62, bar  test loss 3.535, len  test loss 0.038, col  test loss 142.150


Epoch 1342: 272batch [00:43,  6.23batch/s, loss=1.52e+3]


epoch 1342: avg train loss 1547.55, bar train loss 3.545, len train loss 0.036, col train loss 139.769


Epoch 1343: 0batch [00:00, ?batch/s]

epoch 1342: avg test  loss 1563.13, bar  test loss 4.016, len  test loss 0.040, col  test loss 141.822


Epoch 1343: 272batch [00:43,  6.25batch/s, loss=1.75e+3]


epoch 1343: avg train loss 1554.68, bar train loss 3.722, len train loss 0.034, col train loss 140.652


Epoch 1344: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1343: avg test  loss 1562.23, bar  test loss 3.585, len  test loss 0.037, col  test loss 140.866


Epoch 1344: 272batch [00:43,  6.27batch/s, loss=1.55e+3]


epoch 1344: avg train loss 1554.06, bar train loss 3.570, len train loss 0.036, col train loss 140.799


Epoch 1345: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1344: avg test  loss 1563.95, bar  test loss 3.733, len  test loss 0.042, col  test loss 141.953


Epoch 1345: 272batch [00:43,  6.31batch/s, loss=1.74e+3]


epoch 1345: avg train loss 1555.73, bar train loss 3.626, len train loss 0.035, col train loss 140.995
epoch 1345: avg test  loss 1568.40, bar  test loss 3.926, len  test loss 0.033, col  test loss 141.471


Epoch 1346: 272batch [00:43,  6.27batch/s, loss=1.5e+3] 


epoch 1346: avg train loss 1553.74, bar train loss 3.730, len train loss 0.035, col train loss 140.628


Epoch 1347: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1346: avg test  loss 1563.18, bar  test loss 3.809, len  test loss 0.042, col  test loss 141.519


Epoch 1347: 272batch [00:42,  6.36batch/s, loss=1.63e+3]


epoch 1347: avg train loss 1550.89, bar train loss 3.628, len train loss 0.035, col train loss 140.656


Epoch 1348: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1347: avg test  loss 1561.76, bar  test loss 3.701, len  test loss 0.040, col  test loss 141.641


Epoch 1348: 272batch [00:43,  6.28batch/s, loss=1.51e+3]


epoch 1348: avg train loss 1552.03, bar train loss 3.818, len train loss 0.037, col train loss 140.548


Epoch 1349: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1348: avg test  loss 1568.95, bar  test loss 4.168, len  test loss 0.053, col  test loss 142.800


Epoch 1349: 272batch [00:43,  6.25batch/s, loss=1.58e+3]


epoch 1349: avg train loss 1555.23, bar train loss 3.664, len train loss 0.041, col train loss 140.907


Epoch 1350: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1349: avg test  loss 1567.64, bar  test loss 3.998, len  test loss 0.040, col  test loss 141.707


Epoch 1350: 272batch [00:43,  6.21batch/s, loss=1.6e+3] 


epoch 1350: avg train loss 1558.06, bar train loss 3.830, len train loss 0.038, col train loss 141.014
epoch 1350: avg test  loss 1582.09, bar  test loss 4.871, len  test loss 0.038, col  test loss 141.369


Epoch 1351: 272batch [00:43,  6.31batch/s, loss=1.54e+3]


epoch 1351: avg train loss 1556.96, bar train loss 3.694, len train loss 0.036, col train loss 141.127


Epoch 1352: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1351: avg test  loss 1567.41, bar  test loss 3.960, len  test loss 0.036, col  test loss 141.162


Epoch 1352: 272batch [00:43,  6.32batch/s, loss=1.58e+3]


epoch 1352: avg train loss 1555.88, bar train loss 3.659, len train loss 0.039, col train loss 141.055


Epoch 1353: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1352: avg test  loss 1561.72, bar  test loss 3.659, len  test loss 0.041, col  test loss 141.912


Epoch 1353: 272batch [00:43,  6.31batch/s, loss=1.85e+3]


epoch 1353: avg train loss 1556.13, bar train loss 3.767, len train loss 0.039, col train loss 141.181


Epoch 1354: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1353: avg test  loss 1580.88, bar  test loss 4.098, len  test loss 0.048, col  test loss 143.829


Epoch 1354: 272batch [00:43,  6.29batch/s, loss=1.51e+3]


epoch 1354: avg train loss 1555.90, bar train loss 3.580, len train loss 0.038, col train loss 141.247


Epoch 1355: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1354: avg test  loss 1570.06, bar  test loss 3.724, len  test loss 0.038, col  test loss 142.346


Epoch 1355: 272batch [00:43,  6.26batch/s, loss=1.56e+3]


epoch 1355: avg train loss 1554.67, bar train loss 3.531, len train loss 0.035, col train loss 141.099
epoch 1355: avg test  loss 1572.40, bar  test loss 4.493, len  test loss 0.036, col  test loss 142.480


Epoch 1356: 272batch [00:44,  6.18batch/s, loss=1.55e+3]


epoch 1356: avg train loss 1558.50, bar train loss 3.928, len train loss 0.034, col train loss 140.960


Epoch 1357: 1batch [00:00,  7.75batch/s, loss=1.6e+3]

epoch 1356: avg test  loss 1580.86, bar  test loss 4.613, len  test loss 0.037, col  test loss 142.237


Epoch 1357: 272batch [00:43,  6.20batch/s, loss=1.6e+3] 


epoch 1357: avg train loss 1557.36, bar train loss 3.661, len train loss 0.036, col train loss 141.116


Epoch 1358: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1357: avg test  loss 1563.96, bar  test loss 3.578, len  test loss 0.036, col  test loss 142.097


Epoch 1358: 272batch [00:43,  6.31batch/s, loss=1.78e+3]


epoch 1358: avg train loss 1555.68, bar train loss 3.761, len train loss 0.035, col train loss 141.005


Epoch 1359: 0batch [00:00, ?batch/s]

epoch 1358: avg test  loss 1563.73, bar  test loss 3.608, len  test loss 0.034, col  test loss 141.848


Epoch 1359: 272batch [00:43,  6.24batch/s, loss=1.62e+3]


epoch 1359: avg train loss 1560.13, bar train loss 4.070, len train loss 0.036, col train loss 140.890


Epoch 1360: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1359: avg test  loss 1614.47, bar  test loss 8.978, len  test loss 0.037, col  test loss 141.470


Epoch 1360: 272batch [00:43,  6.29batch/s, loss=1.71e+3]


epoch 1360: avg train loss 1556.65, bar train loss 3.978, len train loss 0.036, col train loss 140.906
epoch 1360: avg test  loss 1566.48, bar  test loss 3.704, len  test loss 0.038, col  test loss 143.592


Epoch 1361: 272batch [00:43,  6.26batch/s, loss=1.58e+3]


epoch 1361: avg train loss 1553.04, bar train loss 3.783, len train loss 0.036, col train loss 140.751


Epoch 1362: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1361: avg test  loss 1558.32, bar  test loss 3.645, len  test loss 0.037, col  test loss 140.922


Epoch 1362: 272batch [00:43,  6.29batch/s, loss=1.64e+3]


epoch 1362: avg train loss 1551.95, bar train loss 3.609, len train loss 0.034, col train loss 140.759


Epoch 1363: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1362: avg test  loss 1569.26, bar  test loss 4.089, len  test loss 0.033, col  test loss 141.651


Epoch 1363: 272batch [00:43,  6.21batch/s, loss=1.46e+3]


epoch 1363: avg train loss 1558.07, bar train loss 3.771, len train loss 0.035, col train loss 141.513


Epoch 1364: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1363: avg test  loss 1567.48, bar  test loss 4.279, len  test loss 0.034, col  test loss 141.476


Epoch 1364: 272batch [00:43,  6.25batch/s, loss=1.63e+3]


epoch 1364: avg train loss 1556.22, bar train loss 3.646, len train loss 0.036, col train loss 140.992


Epoch 1365: 0batch [00:00, ?batch/s]

epoch 1364: avg test  loss 1563.31, bar  test loss 3.658, len  test loss 0.043, col  test loss 141.446


Epoch 1365: 272batch [00:43,  6.26batch/s, loss=1.57e+3]


epoch 1365: avg train loss 1561.47, bar train loss 4.057, len train loss 0.038, col train loss 141.246
epoch 1365: avg test  loss 1565.11, bar  test loss 3.591, len  test loss 0.037, col  test loss 142.340


Epoch 1366: 272batch [00:43,  6.23batch/s, loss=1.76e+3]


epoch 1366: avg train loss 1554.47, bar train loss 3.790, len train loss 0.035, col train loss 140.930


Epoch 1367: 0batch [00:00, ?batch/s, loss=1.61e+3]

epoch 1366: avg test  loss 1567.06, bar  test loss 3.951, len  test loss 0.037, col  test loss 142.395


Epoch 1367: 272batch [00:43,  6.27batch/s, loss=1.52e+3]


epoch 1367: avg train loss 1556.39, bar train loss 3.671, len train loss 0.035, col train loss 141.196


Epoch 1368: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1367: avg test  loss 1569.83, bar  test loss 3.738, len  test loss 0.038, col  test loss 142.803


Epoch 1368: 272batch [00:43,  6.23batch/s, loss=1.54e+3]


epoch 1368: avg train loss 1556.39, bar train loss 3.653, len train loss 0.036, col train loss 141.486


Epoch 1369: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1368: avg test  loss 1566.70, bar  test loss 3.788, len  test loss 0.040, col  test loss 143.645


Epoch 1369: 272batch [00:44,  6.18batch/s, loss=1.58e+3]


epoch 1369: avg train loss 1557.18, bar train loss 3.742, len train loss 0.036, col train loss 141.396


Epoch 1370: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1369: avg test  loss 1573.39, bar  test loss 4.445, len  test loss 0.041, col  test loss 142.122


Epoch 1370: 272batch [00:44,  6.07batch/s, loss=1.5e+3] 


epoch 1370: avg train loss 1560.82, bar train loss 3.892, len train loss 0.035, col train loss 141.223
epoch 1370: avg test  loss 1575.46, bar  test loss 3.849, len  test loss 0.045, col  test loss 143.069


Epoch 1371: 272batch [00:43,  6.23batch/s, loss=1.51e+3]


epoch 1371: avg train loss 1555.23, bar train loss 3.635, len train loss 0.036, col train loss 141.022


Epoch 1372: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1371: avg test  loss 1571.22, bar  test loss 4.362, len  test loss 0.042, col  test loss 141.699


Epoch 1372: 272batch [00:43,  6.23batch/s, loss=1.66e+3]


epoch 1372: avg train loss 1556.27, bar train loss 3.892, len train loss 0.036, col train loss 140.950


Epoch 1373: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1372: avg test  loss 1562.59, bar  test loss 3.709, len  test loss 0.034, col  test loss 141.751


Epoch 1373: 272batch [00:43,  6.26batch/s, loss=1.59e+3]


epoch 1373: avg train loss 1552.75, bar train loss 3.576, len train loss 0.034, col train loss 140.827


Epoch 1374: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1373: avg test  loss 1557.46, bar  test loss 3.592, len  test loss 0.038, col  test loss 141.264


Epoch 1374: 272batch [00:43,  6.27batch/s, loss=1.46e+3]


epoch 1374: avg train loss 1551.64, bar train loss 3.633, len train loss 0.035, col train loss 140.970


Epoch 1375: 0batch [00:00, ?batch/s]

epoch 1374: avg test  loss 1564.63, bar  test loss 3.649, len  test loss 0.037, col  test loss 142.837


Epoch 1375: 272batch [00:43,  6.22batch/s, loss=1.71e+3]


epoch 1375: avg train loss 1553.83, bar train loss 3.691, len train loss 0.037, col train loss 141.146
epoch 1375: avg test  loss 1571.92, bar  test loss 4.267, len  test loss 0.034, col  test loss 142.107


Epoch 1376: 272batch [00:44,  6.17batch/s, loss=1.69e+3]


epoch 1376: avg train loss 1558.17, bar train loss 3.642, len train loss 0.036, col train loss 141.326


Epoch 1377: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1376: avg test  loss 1582.46, bar  test loss 4.771, len  test loss 0.037, col  test loss 141.875


Epoch 1377: 272batch [00:44,  6.17batch/s, loss=1.61e+3]


epoch 1377: avg train loss 1557.89, bar train loss 3.756, len train loss 0.035, col train loss 141.098


Epoch 1378: 1batch [00:00,  7.63batch/s, loss=1.57e+3]

epoch 1377: avg test  loss 1584.19, bar  test loss 6.015, len  test loss 0.036, col  test loss 141.713


Epoch 1378: 272batch [00:43,  6.22batch/s, loss=1.53e+3]


epoch 1378: avg train loss 1557.57, bar train loss 3.776, len train loss 0.036, col train loss 141.110


Epoch 1379: 0batch [00:00, ?batch/s, loss=1.63e+3]

epoch 1378: avg test  loss 1573.61, bar  test loss 3.894, len  test loss 0.038, col  test loss 143.393


Epoch 1379: 272batch [00:43,  6.21batch/s, loss=1.72e+3]


epoch 1379: avg train loss 1560.19, bar train loss 3.776, len train loss 0.038, col train loss 141.258


Epoch 1380: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1379: avg test  loss 1578.13, bar  test loss 3.953, len  test loss 0.045, col  test loss 143.859


Epoch 1380: 272batch [00:43,  6.22batch/s, loss=1.45e+3]


epoch 1380: avg train loss 1558.93, bar train loss 3.703, len train loss 0.038, col train loss 141.249
epoch 1380: avg test  loss 1567.18, bar  test loss 3.950, len  test loss 0.039, col  test loss 141.560


Epoch 1381: 272batch [00:44,  6.16batch/s, loss=1.73e+3]


epoch 1381: avg train loss 1558.85, bar train loss 3.678, len train loss 0.036, col train loss 141.434


Epoch 1382: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1381: avg test  loss 1620.28, bar  test loss 8.766, len  test loss 0.036, col  test loss 142.519


Epoch 1382: 272batch [00:44,  6.14batch/s, loss=1.59e+3]


epoch 1382: avg train loss 1561.06, bar train loss 3.922, len train loss 0.036, col train loss 141.497


Epoch 1383: 0batch [00:00, ?batch/s, loss=1.44e+3]

epoch 1382: avg test  loss 1568.88, bar  test loss 3.803, len  test loss 0.039, col  test loss 142.032


Epoch 1383: 272batch [00:43,  6.21batch/s, loss=1.64e+3]


epoch 1383: avg train loss 1555.22, bar train loss 3.642, len train loss 0.037, col train loss 141.286


Epoch 1384: 1batch [00:00,  7.69batch/s, loss=1.61e+3]

epoch 1383: avg test  loss 1653.46, bar  test loss 11.167, len  test loss 0.041, col  test loss 142.685


Epoch 1384: 272batch [00:43,  6.23batch/s, loss=1.51e+3]


epoch 1384: avg train loss 1564.73, bar train loss 4.419, len train loss 0.036, col train loss 141.250


Epoch 1385: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1384: avg test  loss 1566.15, bar  test loss 3.764, len  test loss 0.039, col  test loss 143.200


Epoch 1385: 272batch [00:43,  6.24batch/s, loss=1.62e+3]


epoch 1385: avg train loss 1559.43, bar train loss 3.842, len train loss 0.038, col train loss 141.175
epoch 1385: avg test  loss 1583.14, bar  test loss 4.253, len  test loss 0.037, col  test loss 142.911


Epoch 1386: 272batch [00:43,  6.24batch/s, loss=1.52e+3]


epoch 1386: avg train loss 1562.63, bar train loss 3.808, len train loss 0.037, col train loss 141.461


Epoch 1387: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1386: avg test  loss 1571.70, bar  test loss 3.835, len  test loss 0.037, col  test loss 142.946


Epoch 1387: 272batch [00:44,  6.07batch/s, loss=1.44e+3]


epoch 1387: avg train loss 1557.24, bar train loss 3.823, len train loss 0.035, col train loss 140.848


Epoch 1388: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1387: avg test  loss 1561.19, bar  test loss 3.895, len  test loss 0.035, col  test loss 141.176


Epoch 1388: 272batch [00:43,  6.22batch/s, loss=1.49e+3]


epoch 1388: avg train loss 1556.27, bar train loss 3.721, len train loss 0.035, col train loss 141.288


Epoch 1389: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1388: avg test  loss 1572.85, bar  test loss 3.719, len  test loss 0.036, col  test loss 142.813


Epoch 1389: 272batch [00:44,  6.17batch/s, loss=1.7e+3] 


epoch 1389: avg train loss 1564.14, bar train loss 3.948, len train loss 0.036, col train loss 141.486


Epoch 1390: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1389: avg test  loss 1579.95, bar  test loss 4.768, len  test loss 0.037, col  test loss 142.424


Epoch 1390: 272batch [00:44,  6.17batch/s, loss=1.69e+3]


epoch 1390: avg train loss 1557.83, bar train loss 3.797, len train loss 0.036, col train loss 141.479
epoch 1390: avg test  loss 1573.33, bar  test loss 3.999, len  test loss 0.038, col  test loss 143.803


Epoch 1391: 272batch [00:43,  6.21batch/s, loss=1.55e+3]


epoch 1391: avg train loss 1560.08, bar train loss 3.832, len train loss 0.035, col train loss 141.697


Epoch 1392: 0batch [00:00, ?batch/s, loss=1.64e+3]

epoch 1391: avg test  loss 1574.09, bar  test loss 4.251, len  test loss 0.041, col  test loss 142.115


Epoch 1392: 272batch [00:43,  6.20batch/s, loss=1.76e+3]


epoch 1392: avg train loss 1560.05, bar train loss 3.596, len train loss 0.037, col train loss 141.455


Epoch 1393: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1392: avg test  loss 1573.34, bar  test loss 4.316, len  test loss 0.037, col  test loss 142.477


Epoch 1393: 272batch [00:45,  6.03batch/s, loss=1.55e+3]


epoch 1393: avg train loss 1563.27, bar train loss 3.836, len train loss 0.036, col train loss 141.179


Epoch 1394: 0batch [00:00, ?batch/s, loss=1.66e+3]

epoch 1393: avg test  loss 1578.26, bar  test loss 3.820, len  test loss 0.047, col  test loss 142.367


Epoch 1394: 272batch [00:45,  6.03batch/s, loss=1.43e+3]


epoch 1394: avg train loss 1559.94, bar train loss 3.614, len train loss 0.035, col train loss 141.235


Epoch 1395: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1394: avg test  loss 1583.29, bar  test loss 4.805, len  test loss 0.039, col  test loss 141.799


Epoch 1395: 272batch [00:44,  6.16batch/s, loss=1.71e+3]


epoch 1395: avg train loss 1556.19, bar train loss 3.609, len train loss 0.035, col train loss 141.165
epoch 1395: avg test  loss 1570.61, bar  test loss 4.055, len  test loss 0.044, col  test loss 142.777


Epoch 1396: 272batch [00:44,  6.15batch/s, loss=1.68e+3]


epoch 1396: avg train loss 1557.98, bar train loss 3.747, len train loss 0.038, col train loss 141.417


Epoch 1397: 0batch [00:00, ?batch/s]

epoch 1396: avg test  loss 1568.69, bar  test loss 3.739, len  test loss 0.037, col  test loss 140.723


Epoch 1397: 272batch [00:44,  6.15batch/s, loss=1.55e+3]


epoch 1397: avg train loss 1557.51, bar train loss 3.783, len train loss 0.037, col train loss 140.883


Epoch 1398: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1397: avg test  loss 1584.76, bar  test loss 5.651, len  test loss 0.039, col  test loss 141.889


Epoch 1398: 272batch [00:44,  6.14batch/s, loss=1.63e+3]


epoch 1398: avg train loss 1557.16, bar train loss 3.778, len train loss 0.036, col train loss 141.178


Epoch 1399: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1398: avg test  loss 1571.46, bar  test loss 4.013, len  test loss 0.047, col  test loss 141.805


Epoch 1399: 272batch [00:44,  6.06batch/s, loss=1.43e+3]


epoch 1399: avg train loss 1555.89, bar train loss 3.665, len train loss 0.038, col train loss 141.301


Epoch 1400: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1399: avg test  loss 1567.66, bar  test loss 4.095, len  test loss 0.040, col  test loss 141.947


Epoch 1400: 272batch [00:44,  6.09batch/s, loss=1.55e+3]


epoch 1400: avg train loss 1557.84, bar train loss 3.708, len train loss 0.036, col train loss 141.089
epoch 1400: avg test  loss 1566.55, bar  test loss 4.099, len  test loss 0.034, col  test loss 141.181


Epoch 1401: 272batch [00:44,  6.15batch/s, loss=1.65e+3]


epoch 1401: avg train loss 1556.02, bar train loss 3.588, len train loss 0.035, col train loss 140.944


Epoch 1402: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1401: avg test  loss 1570.78, bar  test loss 3.572, len  test loss 0.043, col  test loss 141.726


Epoch 1402: 272batch [00:43,  6.19batch/s, loss=1.47e+3]


epoch 1402: avg train loss 1559.31, bar train loss 4.007, len train loss 0.035, col train loss 141.275


Epoch 1403: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1402: avg test  loss 1568.20, bar  test loss 3.802, len  test loss 0.038, col  test loss 142.392


Epoch 1403: 272batch [00:43,  6.20batch/s, loss=1.52e+3]


epoch 1403: avg train loss 1557.03, bar train loss 3.860, len train loss 0.035, col train loss 141.211


Epoch 1404: 0batch [00:00, ?batch/s, loss=1.65e+3]

epoch 1403: avg test  loss 1656.11, bar  test loss 12.749, len  test loss 0.038, col  test loss 142.675


Epoch 1404: 272batch [00:43,  6.18batch/s, loss=1.68e+3]


epoch 1404: avg train loss 1569.91, bar train loss 4.944, len train loss 0.037, col train loss 141.335


Epoch 1405: 0batch [00:00, ?batch/s, loss=1.69e+3]

epoch 1404: avg test  loss 1604.58, bar  test loss 6.391, len  test loss 0.074, col  test loss 143.634


Epoch 1405: 272batch [00:45,  5.98batch/s, loss=1.55e+3]


epoch 1405: avg train loss 1559.00, bar train loss 3.657, len train loss 0.039, col train loss 141.617
epoch 1405: avg test  loss 1568.24, bar  test loss 3.750, len  test loss 0.040, col  test loss 143.070


Epoch 1406: 272batch [00:44,  6.08batch/s, loss=1.59e+3]


epoch 1406: avg train loss 1563.21, bar train loss 4.139, len train loss 0.036, col train loss 141.625


Epoch 1407: 0batch [00:00, ?batch/s]

epoch 1406: avg test  loss 1575.52, bar  test loss 4.497, len  test loss 0.041, col  test loss 143.698


Epoch 1407: 272batch [00:44,  6.15batch/s, loss=1.48e+3]


epoch 1407: avg train loss 1555.99, bar train loss 3.642, len train loss 0.035, col train loss 141.156


Epoch 1408: 0batch [00:00, ?batch/s, loss=1.51e+3]

epoch 1407: avg test  loss 1576.89, bar  test loss 4.069, len  test loss 0.036, col  test loss 142.970


Epoch 1408: 272batch [00:44,  6.18batch/s, loss=1.55e+3]


epoch 1408: avg train loss 1558.57, bar train loss 3.681, len train loss 0.035, col train loss 141.630


Epoch 1409: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1408: avg test  loss 1585.92, bar  test loss 4.107, len  test loss 0.058, col  test loss 144.279


Epoch 1409: 272batch [00:44,  6.17batch/s, loss=1.5e+3] 


epoch 1409: avg train loss 1560.03, bar train loss 3.853, len train loss 0.039, col train loss 141.600


Epoch 1410: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1409: avg test  loss 1569.92, bar  test loss 4.152, len  test loss 0.039, col  test loss 141.506


Epoch 1410: 272batch [00:45,  5.94batch/s, loss=1.55e+3]


epoch 1410: avg train loss 1561.29, bar train loss 3.962, len train loss 0.035, col train loss 141.146
epoch 1410: avg test  loss 1592.83, bar  test loss 6.146, len  test loss 0.038, col  test loss 142.114


Epoch 1411: 272batch [00:45,  5.96batch/s, loss=1.54e+3]


epoch 1411: avg train loss 1555.64, bar train loss 3.614, len train loss 0.035, col train loss 141.209


Epoch 1412: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1411: avg test  loss 1575.16, bar  test loss 4.323, len  test loss 0.040, col  test loss 142.559


Epoch 1412: 272batch [00:45,  5.95batch/s, loss=1.61e+3]


epoch 1412: avg train loss 1557.16, bar train loss 3.722, len train loss 0.035, col train loss 141.425


Epoch 1413: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1412: avg test  loss 1602.46, bar  test loss 6.170, len  test loss 0.037, col  test loss 142.933


Epoch 1413: 272batch [00:44,  6.14batch/s, loss=1.64e+3]


epoch 1413: avg train loss 1558.83, bar train loss 3.854, len train loss 0.038, col train loss 141.297


Epoch 1414: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1413: avg test  loss 1580.78, bar  test loss 4.957, len  test loss 0.041, col  test loss 141.837


Epoch 1414: 272batch [00:43,  6.19batch/s, loss=1.67e+3]


epoch 1414: avg train loss 1556.26, bar train loss 3.836, len train loss 0.036, col train loss 141.023


Epoch 1415: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1414: avg test  loss 1580.90, bar  test loss 4.462, len  test loss 0.045, col  test loss 142.925


Epoch 1415: 272batch [00:44,  6.15batch/s, loss=1.47e+3]


epoch 1415: avg train loss 1566.21, bar train loss 3.820, len train loss 0.037, col train loss 141.813
epoch 1415: avg test  loss 1567.84, bar  test loss 3.640, len  test loss 0.036, col  test loss 141.975


Epoch 1416: 272batch [00:44,  6.15batch/s, loss=1.61e+3]


epoch 1416: avg train loss 1560.27, bar train loss 3.605, len train loss 0.037, col train loss 141.756


Epoch 1417: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1416: avg test  loss 1578.22, bar  test loss 4.131, len  test loss 0.041, col  test loss 143.578


Epoch 1417: 272batch [00:44,  6.11batch/s, loss=1.62e+3]


epoch 1417: avg train loss 1559.17, bar train loss 3.641, len train loss 0.035, col train loss 141.271


Epoch 1418: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1417: avg test  loss 1565.24, bar  test loss 3.675, len  test loss 0.036, col  test loss 142.335


Epoch 1418: 272batch [00:44,  6.05batch/s, loss=1.59e+3]


epoch 1418: avg train loss 1560.50, bar train loss 3.732, len train loss 0.036, col train loss 141.536


Epoch 1419: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1418: avg test  loss 1586.54, bar  test loss 5.010, len  test loss 0.038, col  test loss 142.084


Epoch 1419: 272batch [00:45,  6.02batch/s, loss=1.54e+3]


epoch 1419: avg train loss 1563.38, bar train loss 4.001, len train loss 0.038, col train loss 141.274


Epoch 1420: 0batch [00:00, ?batch/s]

epoch 1419: avg test  loss 1562.50, bar  test loss 3.728, len  test loss 0.036, col  test loss 142.232


Epoch 1420: 272batch [00:44,  6.13batch/s, loss=1.53e+3]


epoch 1420: avg train loss 1562.87, bar train loss 3.928, len train loss 0.037, col train loss 141.755
epoch 1420: avg test  loss 1578.49, bar  test loss 4.088, len  test loss 0.040, col  test loss 145.160


Epoch 1421: 272batch [00:44,  6.10batch/s, loss=1.52e+3]


epoch 1421: avg train loss 1564.38, bar train loss 3.783, len train loss 0.038, col train loss 142.065


Epoch 1422: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1421: avg test  loss 1569.76, bar  test loss 3.641, len  test loss 0.038, col  test loss 142.615


Epoch 1422: 272batch [00:45,  5.97batch/s, loss=1.62e+3]


epoch 1422: avg train loss 1562.95, bar train loss 3.706, len train loss 0.036, col train loss 141.805


Epoch 1423: 0batch [00:00, ?batch/s]

epoch 1422: avg test  loss 1580.71, bar  test loss 3.955, len  test loss 0.041, col  test loss 143.043


Epoch 1423: 272batch [00:45,  5.98batch/s, loss=1.5e+3] 


epoch 1423: avg train loss 1565.53, bar train loss 3.724, len train loss 0.046, col train loss 142.289


Epoch 1424: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1423: avg test  loss 1574.62, bar  test loss 3.880, len  test loss 0.035, col  test loss 142.006


Epoch 1424: 272batch [00:44,  6.10batch/s, loss=1.63e+3]


epoch 1424: avg train loss 1560.95, bar train loss 3.650, len train loss 0.035, col train loss 141.402


Epoch 1425: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1424: avg test  loss 1583.61, bar  test loss 5.351, len  test loss 0.036, col  test loss 142.003


Epoch 1425: 272batch [00:44,  6.13batch/s, loss=1.56e+3]


epoch 1425: avg train loss 1562.09, bar train loss 3.795, len train loss 0.035, col train loss 141.456
epoch 1425: avg test  loss 1573.83, bar  test loss 4.489, len  test loss 0.040, col  test loss 142.173


Epoch 1426: 272batch [00:44,  6.12batch/s, loss=1.53e+3]


epoch 1426: avg train loss 1559.73, bar train loss 3.842, len train loss 0.039, col train loss 141.555


Epoch 1427: 1batch [00:00,  7.75batch/s, loss=1.52e+3]

epoch 1426: avg test  loss 1568.02, bar  test loss 3.821, len  test loss 0.039, col  test loss 142.156


Epoch 1427: 272batch [00:44,  6.06batch/s, loss=1.5e+3] 


epoch 1427: avg train loss 1561.69, bar train loss 3.728, len train loss 0.036, col train loss 141.793


Epoch 1428: 0batch [00:00, ?batch/s]

epoch 1427: avg test  loss 1571.98, bar  test loss 3.737, len  test loss 0.042, col  test loss 141.738


Epoch 1428: 272batch [00:45,  6.01batch/s, loss=1.43e+3]


epoch 1428: avg train loss 1563.04, bar train loss 3.598, len train loss 0.036, col train loss 141.952


Epoch 1429: 0batch [00:00, ?batch/s]

epoch 1428: avg test  loss 1583.89, bar  test loss 4.608, len  test loss 0.038, col  test loss 142.752


Epoch 1429: 272batch [00:45,  5.95batch/s, loss=1.6e+3] 


epoch 1429: avg train loss 1565.00, bar train loss 3.895, len train loss 0.038, col train loss 141.695


Epoch 1430: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1429: avg test  loss 1568.28, bar  test loss 3.655, len  test loss 0.038, col  test loss 142.205


Epoch 1430: 272batch [00:44,  6.13batch/s, loss=1.46e+3]


epoch 1430: avg train loss 1564.39, bar train loss 3.805, len train loss 0.039, col train loss 142.077
epoch 1430: avg test  loss 1575.40, bar  test loss 3.809, len  test loss 0.050, col  test loss 143.598


Epoch 1431: 272batch [00:44,  6.05batch/s, loss=1.65e+3]


epoch 1431: avg train loss 1562.37, bar train loss 3.761, len train loss 0.037, col train loss 141.992


Epoch 1432: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1431: avg test  loss 1567.07, bar  test loss 4.121, len  test loss 0.037, col  test loss 142.610


Epoch 1432: 272batch [00:45,  6.02batch/s, loss=1.39e+3]


epoch 1432: avg train loss 1564.65, bar train loss 4.059, len train loss 0.038, col train loss 141.816


Epoch 1433: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1432: avg test  loss 1568.21, bar  test loss 3.751, len  test loss 0.037, col  test loss 141.864


Epoch 1433: 272batch [00:45,  5.98batch/s, loss=1.54e+3]


epoch 1433: avg train loss 1564.92, bar train loss 3.788, len train loss 0.039, col train loss 141.916


Epoch 1434: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1433: avg test  loss 1582.75, bar  test loss 4.211, len  test loss 0.046, col  test loss 143.010


Epoch 1434: 272batch [00:44,  6.08batch/s, loss=1.59e+3]


epoch 1434: avg train loss 1562.82, bar train loss 3.704, len train loss 0.039, col train loss 142.220


Epoch 1435: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1434: avg test  loss 1573.06, bar  test loss 4.065, len  test loss 0.043, col  test loss 143.356


Epoch 1435: 272batch [00:44,  6.15batch/s, loss=1.6e+3] 


epoch 1435: avg train loss 1565.71, bar train loss 3.769, len train loss 0.041, col train loss 142.082
epoch 1435: avg test  loss 1577.24, bar  test loss 4.008, len  test loss 0.036, col  test loss 143.490


Epoch 1436: 272batch [00:44,  6.05batch/s, loss=1.67e+3]


epoch 1436: avg train loss 1562.60, bar train loss 3.766, len train loss 0.036, col train loss 141.824


Epoch 1437: 0batch [00:00, ?batch/s, loss=1.48e+3]

epoch 1436: avg test  loss 1569.46, bar  test loss 3.631, len  test loss 0.043, col  test loss 143.091


Epoch 1437: 272batch [00:44,  6.11batch/s, loss=1.64e+3]


epoch 1437: avg train loss 1561.83, bar train loss 3.760, len train loss 0.036, col train loss 141.608


Epoch 1438: 0batch [00:00, ?batch/s]

epoch 1437: avg test  loss 1572.90, bar  test loss 3.665, len  test loss 0.039, col  test loss 143.725


Epoch 1438: 272batch [00:44,  6.09batch/s, loss=1.54e+3]


epoch 1438: avg train loss 1561.19, bar train loss 3.577, len train loss 0.035, col train loss 142.162


Epoch 1439: 0batch [00:00, ?batch/s]

epoch 1438: avg test  loss 1577.39, bar  test loss 4.325, len  test loss 0.043, col  test loss 143.204


Epoch 1439: 272batch [00:44,  6.08batch/s, loss=1.58e+3]


epoch 1439: avg train loss 1566.65, bar train loss 3.946, len train loss 0.038, col train loss 142.473


Epoch 1440: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1439: avg test  loss 1571.22, bar  test loss 3.888, len  test loss 0.046, col  test loss 142.468


Epoch 1440: 272batch [00:45,  5.98batch/s, loss=1.62e+3]


epoch 1440: avg train loss 1561.07, bar train loss 3.776, len train loss 0.036, col train loss 141.612
epoch 1440: avg test  loss 1575.94, bar  test loss 3.946, len  test loss 0.048, col  test loss 143.703


Epoch 1441: 272batch [00:46,  5.89batch/s, loss=1.69e+3]


epoch 1441: avg train loss 1569.74, bar train loss 3.898, len train loss 0.038, col train loss 142.792


Epoch 1442: 0batch [00:00, ?batch/s, loss=1.65e+3]

epoch 1441: avg test  loss 1595.36, bar  test loss 5.160, len  test loss 0.041, col  test loss 143.013


Epoch 1442: 272batch [00:45,  6.01batch/s, loss=1.64e+3]


epoch 1442: avg train loss 1567.76, bar train loss 3.688, len train loss 0.037, col train loss 141.801


Epoch 1443: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1442: avg test  loss 1578.20, bar  test loss 4.102, len  test loss 0.040, col  test loss 142.163


Epoch 1443: 272batch [00:45,  6.01batch/s, loss=1.49e+3]


epoch 1443: avg train loss 1565.67, bar train loss 3.766, len train loss 0.038, col train loss 141.713


Epoch 1444: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1443: avg test  loss 1570.31, bar  test loss 3.524, len  test loss 0.038, col  test loss 141.672


Epoch 1444: 272batch [00:45,  6.04batch/s, loss=1.54e+3]


epoch 1444: avg train loss 1564.13, bar train loss 3.747, len train loss 0.037, col train loss 141.555


Epoch 1445: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1444: avg test  loss 1573.77, bar  test loss 3.668, len  test loss 0.037, col  test loss 143.456


Epoch 1445: 272batch [00:44,  6.08batch/s, loss=1.46e+3]


epoch 1445: avg train loss 1564.34, bar train loss 3.681, len train loss 0.036, col train loss 142.104
epoch 1445: avg test  loss 1575.00, bar  test loss 3.715, len  test loss 0.035, col  test loss 143.372


Epoch 1446: 272batch [00:45,  6.01batch/s, loss=1.69e+3]


epoch 1446: avg train loss 1564.42, bar train loss 3.731, len train loss 0.036, col train loss 142.411


Epoch 1447: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1446: avg test  loss 1569.06, bar  test loss 3.711, len  test loss 0.038, col  test loss 142.257


Epoch 1447: 272batch [00:45,  5.93batch/s, loss=1.72e+3]


epoch 1447: avg train loss 1561.39, bar train loss 3.665, len train loss 0.035, col train loss 142.079


Epoch 1448: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1447: avg test  loss 1604.87, bar  test loss 7.091, len  test loss 0.037, col  test loss 142.801


Epoch 1448: 272batch [00:45,  6.00batch/s, loss=1.6e+3] 


epoch 1448: avg train loss 1563.44, bar train loss 3.820, len train loss 0.037, col train loss 142.111


Epoch 1449: 0batch [00:00, ?batch/s, loss=1.64e+3]

epoch 1448: avg test  loss 1593.00, bar  test loss 4.402, len  test loss 0.039, col  test loss 144.064


Epoch 1449: 272batch [00:44,  6.07batch/s, loss=1.53e+3]


epoch 1449: avg train loss 1571.81, bar train loss 4.254, len train loss 0.042, col train loss 142.088


Epoch 1450: 0batch [00:00, ?batch/s, loss=1.46e+3]

epoch 1449: avg test  loss 1567.79, bar  test loss 3.802, len  test loss 0.042, col  test loss 143.069


Epoch 1450: 272batch [00:44,  6.10batch/s, loss=1.52e+3]


epoch 1450: avg train loss 1562.89, bar train loss 3.617, len train loss 0.036, col train loss 141.936
epoch 1450: avg test  loss 1590.83, bar  test loss 5.136, len  test loss 0.037, col  test loss 142.497


Epoch 1451: 272batch [00:45,  5.92batch/s, loss=1.57e+3]


epoch 1451: avg train loss 1564.57, bar train loss 3.820, len train loss 0.037, col train loss 141.845


Epoch 1452: 0batch [00:00, ?batch/s, loss=1.49e+3]

epoch 1451: avg test  loss 1586.69, bar  test loss 4.414, len  test loss 0.045, col  test loss 142.950


Epoch 1452: 272batch [00:46,  5.85batch/s, loss=1.75e+3]


epoch 1452: avg train loss 1572.00, bar train loss 4.143, len train loss 0.038, col train loss 142.357


Epoch 1453: 0batch [00:00, ?batch/s]

epoch 1452: avg test  loss 1573.96, bar  test loss 3.968, len  test loss 0.037, col  test loss 143.035


Epoch 1453: 272batch [00:45,  5.93batch/s, loss=1.56e+3]


epoch 1453: avg train loss 1558.53, bar train loss 3.574, len train loss 0.036, col train loss 141.695


Epoch 1454: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1453: avg test  loss 1576.91, bar  test loss 3.666, len  test loss 0.037, col  test loss 142.842


Epoch 1454: 272batch [00:44,  6.09batch/s, loss=1.58e+3]


epoch 1454: avg train loss 1563.38, bar train loss 3.725, len train loss 0.036, col train loss 142.047


Epoch 1455: 0batch [00:00, ?batch/s]

epoch 1454: avg test  loss 1571.98, bar  test loss 4.419, len  test loss 0.040, col  test loss 142.886


Epoch 1455: 272batch [00:45,  6.04batch/s, loss=1.51e+3]


epoch 1455: avg train loss 1562.26, bar train loss 3.869, len train loss 0.036, col train loss 141.951
epoch 1455: avg test  loss 1577.30, bar  test loss 3.831, len  test loss 0.036, col  test loss 143.037


Epoch 1456: 272batch [00:46,  5.88batch/s, loss=1.54e+3]


epoch 1456: avg train loss 1565.98, bar train loss 3.869, len train loss 0.036, col train loss 141.997


Epoch 1457: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1456: avg test  loss 1575.87, bar  test loss 3.926, len  test loss 0.038, col  test loss 142.544


Epoch 1457: 272batch [00:45,  5.97batch/s, loss=1.54e+3]


epoch 1457: avg train loss 1563.66, bar train loss 3.743, len train loss 0.037, col train loss 142.015


Epoch 1458: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1457: avg test  loss 1587.88, bar  test loss 4.101, len  test loss 0.039, col  test loss 144.583


Epoch 1458: 272batch [00:45,  6.02batch/s, loss=1.65e+3]


epoch 1458: avg train loss 1561.20, bar train loss 3.767, len train loss 0.036, col train loss 141.818


Epoch 1459: 0batch [00:00, ?batch/s, loss=1.63e+3]

epoch 1458: avg test  loss 1582.83, bar  test loss 4.591, len  test loss 0.036, col  test loss 142.396


Epoch 1459: 272batch [00:45,  6.03batch/s, loss=1.51e+3]


epoch 1459: avg train loss 1565.94, bar train loss 4.034, len train loss 0.040, col train loss 142.097


Epoch 1460: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1459: avg test  loss 1580.98, bar  test loss 4.258, len  test loss 0.049, col  test loss 143.818


Epoch 1460: 272batch [00:45,  6.03batch/s, loss=1.64e+3]


epoch 1460: avg train loss 1567.56, bar train loss 3.697, len train loss 0.039, col train loss 142.212
epoch 1460: avg test  loss 1593.82, bar  test loss 4.274, len  test loss 0.039, col  test loss 143.821


Epoch 1461: 272batch [00:45,  6.00batch/s, loss=1.47e+3]


epoch 1461: avg train loss 1563.63, bar train loss 3.687, len train loss 0.036, col train loss 141.820


Epoch 1462: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1461: avg test  loss 1583.34, bar  test loss 4.139, len  test loss 0.041, col  test loss 143.996


Epoch 1462: 272batch [00:45,  6.01batch/s, loss=1.48e+3]


epoch 1462: avg train loss 1569.71, bar train loss 3.814, len train loss 0.042, col train loss 142.584


Epoch 1463: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1462: avg test  loss 1581.89, bar  test loss 4.128, len  test loss 0.047, col  test loss 143.121


Epoch 1463: 272batch [00:46,  5.88batch/s, loss=1.52e+3]


epoch 1463: avg train loss 1569.56, bar train loss 3.859, len train loss 0.039, col train loss 142.607


Epoch 1464: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1463: avg test  loss 1578.65, bar  test loss 4.053, len  test loss 0.037, col  test loss 143.623


Epoch 1464: 272batch [00:45,  6.01batch/s, loss=1.65e+3]


epoch 1464: avg train loss 1569.47, bar train loss 4.115, len train loss 0.035, col train loss 142.584


Epoch 1465: 0batch [00:00, ?batch/s, loss=1.64e+3]

epoch 1464: avg test  loss 1592.46, bar  test loss 4.138, len  test loss 0.046, col  test loss 144.801


Epoch 1465: 272batch [00:45,  5.99batch/s, loss=1.57e+3]


epoch 1465: avg train loss 1564.89, bar train loss 3.789, len train loss 0.037, col train loss 142.206
epoch 1465: avg test  loss 1573.42, bar  test loss 3.757, len  test loss 0.039, col  test loss 144.081


Epoch 1466: 272batch [00:45,  5.93batch/s, loss=1.58e+3]


epoch 1466: avg train loss 1565.59, bar train loss 3.753, len train loss 0.036, col train loss 142.433


Epoch 1467: 1batch [00:00,  6.71batch/s, loss=1.6e+3]

epoch 1466: avg test  loss 1574.45, bar  test loss 3.776, len  test loss 0.038, col  test loss 143.013


Epoch 1467: 272batch [00:46,  5.88batch/s, loss=1.66e+3]


epoch 1467: avg train loss 1570.03, bar train loss 3.813, len train loss 0.037, col train loss 142.789


Epoch 1468: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1467: avg test  loss 1576.10, bar  test loss 3.842, len  test loss 0.037, col  test loss 143.096


Epoch 1468: 272batch [00:46,  5.89batch/s, loss=1.69e+3]


epoch 1468: avg train loss 1566.49, bar train loss 3.797, len train loss 0.038, col train loss 142.041


Epoch 1469: 0batch [00:00, ?batch/s]

epoch 1468: avg test  loss 1584.27, bar  test loss 4.704, len  test loss 0.036, col  test loss 142.715


Epoch 1469: 272batch [00:45,  5.94batch/s, loss=1.64e+3]


epoch 1469: avg train loss 1563.17, bar train loss 3.635, len train loss 0.036, col train loss 142.309


Epoch 1470: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1469: avg test  loss 1576.51, bar  test loss 4.103, len  test loss 0.039, col  test loss 143.301


Epoch 1470: 272batch [00:45,  5.94batch/s, loss=1.54e+3]


epoch 1470: avg train loss 1565.53, bar train loss 3.894, len train loss 0.037, col train loss 142.287
epoch 1470: avg test  loss 1579.48, bar  test loss 3.967, len  test loss 0.039, col  test loss 143.590


Epoch 1471: 272batch [00:46,  5.91batch/s, loss=1.71e+3]


epoch 1471: avg train loss 1568.89, bar train loss 3.826, len train loss 0.037, col train loss 142.447


Epoch 1472: 0batch [00:00, ?batch/s, loss=1.63e+3]

epoch 1471: avg test  loss 1577.70, bar  test loss 3.850, len  test loss 0.044, col  test loss 144.047


Epoch 1472: 272batch [00:46,  5.87batch/s, loss=1.51e+3]


epoch 1472: avg train loss 1570.83, bar train loss 3.919, len train loss 0.036, col train loss 142.837


Epoch 1473: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1472: avg test  loss 1579.31, bar  test loss 4.040, len  test loss 0.037, col  test loss 143.460


Epoch 1473: 272batch [00:46,  5.84batch/s, loss=1.47e+3]


epoch 1473: avg train loss 1567.36, bar train loss 3.859, len train loss 0.036, col train loss 142.304


Epoch 1474: 0batch [00:00, ?batch/s, loss=1.63e+3]

epoch 1473: avg test  loss 1579.58, bar  test loss 3.740, len  test loss 0.040, col  test loss 144.556


Epoch 1474: 272batch [00:46,  5.80batch/s, loss=1.56e+3]


epoch 1474: avg train loss 1569.35, bar train loss 3.916, len train loss 0.036, col train loss 142.777


Epoch 1475: 0batch [00:00, ?batch/s]

epoch 1474: avg test  loss 1580.30, bar  test loss 3.731, len  test loss 0.034, col  test loss 143.407


Epoch 1475: 272batch [00:45,  5.94batch/s, loss=1.58e+3]


epoch 1475: avg train loss 1571.08, bar train loss 4.040, len train loss 0.036, col train loss 142.492
epoch 1475: avg test  loss 1570.99, bar  test loss 3.761, len  test loss 0.039, col  test loss 142.877


Epoch 1476: 272batch [00:46,  5.87batch/s, loss=1.62e+3]


epoch 1476: avg train loss 1564.02, bar train loss 3.609, len train loss 0.036, col train loss 141.958


Epoch 1477: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1476: avg test  loss 1578.35, bar  test loss 4.100, len  test loss 0.037, col  test loss 143.283


Epoch 1477: 272batch [00:45,  5.93batch/s, loss=1.55e+3]


epoch 1477: avg train loss 1565.55, bar train loss 3.730, len train loss 0.035, col train loss 142.424


Epoch 1478: 0batch [00:00, ?batch/s, loss=1.61e+3]

epoch 1477: avg test  loss 1581.22, bar  test loss 4.104, len  test loss 0.040, col  test loss 143.809


Epoch 1478: 272batch [00:46,  5.89batch/s, loss=1.73e+3]


epoch 1478: avg train loss 1567.83, bar train loss 3.964, len train loss 0.038, col train loss 142.400


Epoch 1479: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1478: avg test  loss 1579.63, bar  test loss 4.034, len  test loss 0.040, col  test loss 143.918


Epoch 1479: 272batch [00:45,  5.92batch/s, loss=1.69e+3]


epoch 1479: avg train loss 1578.82, bar train loss 3.964, len train loss 0.041, col train loss 143.095


Epoch 1480: 0batch [00:00, ?batch/s]

epoch 1479: avg test  loss 1601.56, bar  test loss 4.930, len  test loss 0.044, col  test loss 145.321


Epoch 1480: 272batch [00:46,  5.84batch/s, loss=1.68e+3]


epoch 1480: avg train loss 1578.08, bar train loss 4.420, len train loss 0.037, col train loss 142.464
epoch 1480: avg test  loss 1575.58, bar  test loss 3.825, len  test loss 0.035, col  test loss 143.090


Epoch 1481: 272batch [00:49,  5.47batch/s, loss=1.52e+3]


epoch 1481: avg train loss 1566.74, bar train loss 3.723, len train loss 0.035, col train loss 142.181


Epoch 1482: 0batch [00:00, ?batch/s]

epoch 1481: avg test  loss 1586.39, bar  test loss 3.814, len  test loss 0.042, col  test loss 144.781


Epoch 1482: 272batch [00:47,  5.67batch/s, loss=1.72e+3]


epoch 1482: avg train loss 1569.98, bar train loss 3.934, len train loss 0.038, col train loss 142.415


Epoch 1483: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1482: avg test  loss 1605.41, bar  test loss 6.666, len  test loss 0.046, col  test loss 143.481


Epoch 1483: 272batch [00:48,  5.56batch/s, loss=1.49e+3]


epoch 1483: avg train loss 1567.94, bar train loss 3.996, len train loss 0.037, col train loss 142.006


Epoch 1484: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1483: avg test  loss 1579.82, bar  test loss 4.110, len  test loss 0.038, col  test loss 142.883


Epoch 1484: 272batch [00:48,  5.64batch/s, loss=1.65e+3]


epoch 1484: avg train loss 1567.65, bar train loss 3.868, len train loss 0.035, col train loss 142.272


Epoch 1485: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1484: avg test  loss 1570.54, bar  test loss 3.679, len  test loss 0.037, col  test loss 143.033


Epoch 1485: 272batch [00:48,  5.60batch/s, loss=1.6e+3] 


epoch 1485: avg train loss 1565.13, bar train loss 3.656, len train loss 0.037, col train loss 141.789
epoch 1485: avg test  loss 1588.69, bar  test loss 4.613, len  test loss 0.039, col  test loss 143.493


Epoch 1486: 272batch [00:52,  5.15batch/s, loss=1.64e+3]


epoch 1486: avg train loss 1570.01, bar train loss 3.825, len train loss 0.036, col train loss 142.509
epoch 1486: avg test  loss 1579.27, bar  test loss 3.784, len  test loss 0.044, col  test loss 144.178


Epoch 1487: 272batch [00:48,  5.55batch/s, loss=1.58e+3]


epoch 1487: avg train loss 1566.44, bar train loss 3.771, len train loss 0.037, col train loss 142.388


Epoch 1488: 0batch [00:00, ?batch/s]

epoch 1487: avg test  loss 1577.24, bar  test loss 3.941, len  test loss 0.037, col  test loss 143.035


Epoch 1488: 272batch [00:49,  5.49batch/s, loss=1.68e+3]


epoch 1488: avg train loss 1579.83, bar train loss 4.094, len train loss 0.036, col train loss 143.469


Epoch 1489: 0batch [00:00, ?batch/s]

epoch 1488: avg test  loss 1580.51, bar  test loss 3.771, len  test loss 0.035, col  test loss 143.478


Epoch 1489: 272batch [00:48,  5.56batch/s, loss=1.74e+3]


epoch 1489: avg train loss 1575.25, bar train loss 3.856, len train loss 0.040, col train loss 143.027


Epoch 1490: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1489: avg test  loss 1580.94, bar  test loss 4.010, len  test loss 0.038, col  test loss 143.806


Epoch 1490: 272batch [00:48,  5.61batch/s, loss=1.6e+3] 


epoch 1490: avg train loss 1572.96, bar train loss 3.880, len train loss 0.040, col train loss 143.087
epoch 1490: avg test  loss 1582.02, bar  test loss 3.992, len  test loss 0.048, col  test loss 143.924


Epoch 1491: 272batch [00:48,  5.59batch/s, loss=1.49e+3]


epoch 1491: avg train loss 1573.34, bar train loss 3.957, len train loss 0.039, col train loss 142.696


Epoch 1492: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1491: avg test  loss 1599.08, bar  test loss 5.117, len  test loss 0.040, col  test loss 142.555


Epoch 1492: 272batch [00:47,  5.69batch/s, loss=1.61e+3]


epoch 1492: avg train loss 1572.40, bar train loss 3.966, len train loss 0.036, col train loss 142.365


Epoch 1493: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1492: avg test  loss 1585.19, bar  test loss 4.054, len  test loss 0.040, col  test loss 143.432


Epoch 1493: 272batch [00:48,  5.63batch/s, loss=1.71e+3]


epoch 1493: avg train loss 1573.63, bar train loss 3.800, len train loss 0.037, col train loss 142.601


Epoch 1494: 0batch [00:00, ?batch/s]

epoch 1493: avg test  loss 1581.31, bar  test loss 4.267, len  test loss 0.040, col  test loss 142.918


Epoch 1494: 272batch [00:48,  5.62batch/s, loss=1.52e+3]


epoch 1494: avg train loss 1567.03, bar train loss 3.641, len train loss 0.036, col train loss 142.620


Epoch 1495: 0batch [00:00, ?batch/s]

epoch 1494: avg test  loss 1589.96, bar  test loss 5.067, len  test loss 0.038, col  test loss 142.604


Epoch 1495: 272batch [00:49,  5.54batch/s, loss=1.69e+3]


epoch 1495: avg train loss 1571.92, bar train loss 4.163, len train loss 0.038, col train loss 142.402
epoch 1495: avg test  loss 1587.20, bar  test loss 4.127, len  test loss 0.040, col  test loss 142.254


Epoch 1496: 272batch [00:49,  5.48batch/s, loss=1.57e+3]


epoch 1496: avg train loss 1567.41, bar train loss 3.845, len train loss 0.039, col train loss 142.456


Epoch 1497: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1496: avg test  loss 1578.72, bar  test loss 3.892, len  test loss 0.056, col  test loss 143.436


Epoch 1497: 272batch [00:48,  5.64batch/s, loss=1.6e+3] 


epoch 1497: avg train loss 1569.00, bar train loss 3.791, len train loss 0.040, col train loss 142.770


Epoch 1498: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1497: avg test  loss 1584.88, bar  test loss 4.264, len  test loss 0.037, col  test loss 144.782


Epoch 1498: 272batch [00:48,  5.61batch/s, loss=1.58e+3]


epoch 1498: avg train loss 1571.16, bar train loss 3.826, len train loss 0.037, col train loss 142.672


Epoch 1499: 0batch [00:00, ?batch/s]

epoch 1498: avg test  loss 1656.77, bar  test loss 11.213, len  test loss 0.038, col  test loss 144.098


Epoch 1499: 272batch [00:48,  5.63batch/s, loss=1.66e+3]


epoch 1499: avg train loss 1569.82, bar train loss 4.037, len train loss 0.037, col train loss 142.526


Epoch 1500: 0batch [00:00, ?batch/s]

epoch 1499: avg test  loss 1577.17, bar  test loss 3.721, len  test loss 0.039, col  test loss 144.745


Epoch 1500: 272batch [00:48,  5.61batch/s, loss=1.49e+3]


epoch 1500: avg train loss 1567.47, bar train loss 3.613, len train loss 0.035, col train loss 142.819
epoch 1500: avg test  loss 1580.26, bar  test loss 3.827, len  test loss 0.035, col  test loss 142.946


Epoch 1501: 272batch [00:49,  5.52batch/s, loss=1.6e+3] 


epoch 1501: avg train loss 1575.28, bar train loss 4.335, len train loss 0.038, col train loss 142.258


Epoch 1502: 0batch [00:00, ?batch/s]

epoch 1501: avg test  loss 1576.36, bar  test loss 3.788, len  test loss 0.041, col  test loss 142.560


Epoch 1502: 272batch [00:50,  5.39batch/s, loss=1.69e+3]


epoch 1502: avg train loss 1565.08, bar train loss 3.943, len train loss 0.036, col train loss 141.732


Epoch 1503: 0batch [00:00, ?batch/s]

epoch 1502: avg test  loss 1590.66, bar  test loss 5.657, len  test loss 0.038, col  test loss 143.637


Epoch 1503: 272batch [00:48,  5.59batch/s, loss=1.59e+3]


epoch 1503: avg train loss 1569.67, bar train loss 4.092, len train loss 0.036, col train loss 142.530


Epoch 1504: 0batch [00:00, ?batch/s]

epoch 1503: avg test  loss 1578.44, bar  test loss 4.157, len  test loss 0.047, col  test loss 142.852


Epoch 1504: 272batch [00:48,  5.60batch/s, loss=1.61e+3]


epoch 1504: avg train loss 1568.42, bar train loss 3.852, len train loss 0.040, col train loss 142.708


Epoch 1505: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1504: avg test  loss 1572.26, bar  test loss 4.035, len  test loss 0.037, col  test loss 142.794


Epoch 1505: 272batch [00:48,  5.61batch/s, loss=1.41e+3]


epoch 1505: avg train loss 1567.37, bar train loss 3.811, len train loss 0.038, col train loss 142.498
epoch 1505: avg test  loss 1576.29, bar  test loss 3.618, len  test loss 0.038, col  test loss 144.031


Epoch 1506: 272batch [00:49,  5.50batch/s, loss=1.78e+3]


epoch 1506: avg train loss 1570.43, bar train loss 3.790, len train loss 0.037, col train loss 142.779


Epoch 1507: 0batch [00:00, ?batch/s]

epoch 1506: avg test  loss 1575.54, bar  test loss 3.769, len  test loss 0.039, col  test loss 143.447


Epoch 1507: 272batch [00:50,  5.44batch/s, loss=1.66e+3]


epoch 1507: avg train loss 1571.97, bar train loss 3.817, len train loss 0.038, col train loss 142.454


Epoch 1508: 0batch [00:00, ?batch/s]

epoch 1507: avg test  loss 1580.47, bar  test loss 4.172, len  test loss 0.039, col  test loss 142.697


Epoch 1508: 272batch [00:48,  5.57batch/s, loss=1.61e+3]


epoch 1508: avg train loss 1570.66, bar train loss 4.110, len train loss 0.037, col train loss 142.397


Epoch 1509: 0batch [00:00, ?batch/s, loss=1.59e+3]

epoch 1508: avg test  loss 1586.81, bar  test loss 4.514, len  test loss 0.058, col  test loss 143.906


Epoch 1509: 272batch [00:48,  5.59batch/s, loss=1.53e+3]


epoch 1509: avg train loss 1574.61, bar train loss 3.941, len train loss 0.042, col train loss 142.797


Epoch 1510: 0batch [00:00, ?batch/s]

epoch 1509: avg test  loss 1583.78, bar  test loss 4.126, len  test loss 0.042, col  test loss 143.130


Epoch 1510: 272batch [00:48,  5.60batch/s, loss=1.56e+3]


epoch 1510: avg train loss 1571.53, bar train loss 4.167, len train loss 0.040, col train loss 142.537
epoch 1510: avg test  loss 1577.50, bar  test loss 4.201, len  test loss 0.040, col  test loss 142.549


Epoch 1511: 272batch [00:48,  5.61batch/s, loss=1.48e+3]


epoch 1511: avg train loss 1567.90, bar train loss 3.794, len train loss 0.035, col train loss 142.090


Epoch 1512: 0batch [00:00, ?batch/s]

epoch 1511: avg test  loss 1581.12, bar  test loss 4.166, len  test loss 0.037, col  test loss 144.081


Epoch 1512: 272batch [00:49,  5.49batch/s, loss=1.66e+3]


epoch 1512: avg train loss 1567.92, bar train loss 3.777, len train loss 0.036, col train loss 142.252


Epoch 1513: 0batch [00:00, ?batch/s]

epoch 1512: avg test  loss 1593.49, bar  test loss 5.555, len  test loss 0.036, col  test loss 143.378


Epoch 1513: 272batch [00:49,  5.47batch/s, loss=1.54e+3]


epoch 1513: avg train loss 1569.50, bar train loss 3.792, len train loss 0.036, col train loss 142.699


Epoch 1514: 0batch [00:00, ?batch/s]

epoch 1513: avg test  loss 1586.64, bar  test loss 4.305, len  test loss 0.041, col  test loss 144.002


Epoch 1514: 272batch [00:49,  5.54batch/s, loss=1.66e+3]


epoch 1514: avg train loss 1569.56, bar train loss 3.727, len train loss 0.036, col train loss 142.775


Epoch 1515: 0batch [00:00, ?batch/s]

epoch 1514: avg test  loss 1580.54, bar  test loss 4.109, len  test loss 0.041, col  test loss 144.160


Epoch 1515: 272batch [00:49,  5.52batch/s, loss=1.51e+3]


epoch 1515: avg train loss 1569.08, bar train loss 3.800, len train loss 0.038, col train loss 142.678
epoch 1515: avg test  loss 1595.45, bar  test loss 5.956, len  test loss 0.038, col  test loss 142.821


Epoch 1516: 272batch [00:49,  5.54batch/s, loss=1.71e+3]


epoch 1516: avg train loss 1565.10, bar train loss 3.852, len train loss 0.037, col train loss 142.146


Epoch 1517: 0batch [00:00, ?batch/s]

epoch 1516: avg test  loss 1593.83, bar  test loss 4.365, len  test loss 0.045, col  test loss 142.969


Epoch 1517: 272batch [00:49,  5.48batch/s, loss=1.65e+3]


epoch 1517: avg train loss 1574.80, bar train loss 3.776, len train loss 0.035, col train loss 143.389


Epoch 1518: 0batch [00:00, ?batch/s]

epoch 1517: avg test  loss 1578.98, bar  test loss 3.635, len  test loss 0.037, col  test loss 143.746


Epoch 1518: 272batch [00:50,  5.39batch/s, loss=1.56e+3]


epoch 1518: avg train loss 1571.52, bar train loss 3.729, len train loss 0.037, col train loss 143.356


Epoch 1519: 0batch [00:00, ?batch/s]

epoch 1518: avg test  loss 1576.56, bar  test loss 3.846, len  test loss 0.042, col  test loss 143.664


Epoch 1519: 272batch [00:48,  5.57batch/s, loss=1.51e+3]


epoch 1519: avg train loss 1580.03, bar train loss 4.715, len train loss 0.038, col train loss 143.084


Epoch 1520: 0batch [00:00, ?batch/s]

epoch 1519: avg test  loss 1590.17, bar  test loss 4.241, len  test loss 0.037, col  test loss 144.424


Epoch 1520: 272batch [00:48,  5.59batch/s, loss=1.79e+3]


epoch 1520: avg train loss 1573.71, bar train loss 3.733, len train loss 0.038, col train loss 142.999
epoch 1520: avg test  loss 1579.63, bar  test loss 3.928, len  test loss 0.045, col  test loss 144.116


Epoch 1521: 272batch [00:49,  5.52batch/s, loss=1.63e+3]


epoch 1521: avg train loss 1571.84, bar train loss 3.936, len train loss 0.038, col train loss 142.615


Epoch 1522: 0batch [00:00, ?batch/s]

epoch 1521: avg test  loss 1593.34, bar  test loss 4.851, len  test loss 0.049, col  test loss 144.108


Epoch 1522: 272batch [00:48,  5.55batch/s, loss=1.79e+3]


epoch 1522: avg train loss 1582.68, bar train loss 3.969, len train loss 0.042, col train loss 143.551


Epoch 1523: 0batch [00:00, ?batch/s]

epoch 1522: avg test  loss 1590.55, bar  test loss 4.085, len  test loss 0.046, col  test loss 144.370


Epoch 1523: 272batch [00:49,  5.47batch/s, loss=1.59e+3]


epoch 1523: avg train loss 1577.59, bar train loss 3.780, len train loss 0.037, col train loss 143.116


Epoch 1524: 0batch [00:00, ?batch/s]

epoch 1523: avg test  loss 1589.94, bar  test loss 4.410, len  test loss 0.038, col  test loss 144.172


Epoch 1524: 272batch [00:50,  5.42batch/s, loss=1.65e+3]


epoch 1524: avg train loss 1577.37, bar train loss 4.151, len train loss 0.037, col train loss 143.334


Epoch 1525: 0batch [00:00, ?batch/s]

epoch 1524: avg test  loss 1584.51, bar  test loss 4.051, len  test loss 0.040, col  test loss 144.826


Epoch 1525: 272batch [00:49,  5.50batch/s, loss=1.59e+3]


epoch 1525: avg train loss 1573.40, bar train loss 3.679, len train loss 0.037, col train loss 143.415
epoch 1525: avg test  loss 1598.05, bar  test loss 4.311, len  test loss 0.044, col  test loss 145.502


Epoch 1526: 272batch [00:49,  5.55batch/s, loss=1.59e+3]


epoch 1526: avg train loss 1574.35, bar train loss 3.832, len train loss 0.038, col train loss 143.411


Epoch 1527: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1526: avg test  loss 1592.61, bar  test loss 4.531, len  test loss 0.036, col  test loss 143.587


Epoch 1527: 272batch [00:49,  5.49batch/s, loss=1.66e+3]


epoch 1527: avg train loss 1574.89, bar train loss 4.027, len train loss 0.036, col train loss 142.524


Epoch 1528: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1527: avg test  loss 1579.08, bar  test loss 4.126, len  test loss 0.038, col  test loss 142.527


Epoch 1528: 272batch [00:48,  5.62batch/s, loss=1.67e+3]


epoch 1528: avg train loss 1571.64, bar train loss 3.848, len train loss 0.036, col train loss 142.698


Epoch 1529: 0batch [00:00, ?batch/s, loss=1.65e+3]

epoch 1528: avg test  loss 1589.16, bar  test loss 4.377, len  test loss 0.040, col  test loss 144.489


Epoch 1529: 272batch [00:49,  5.47batch/s, loss=1.52e+3]


epoch 1529: avg train loss 1575.37, bar train loss 3.963, len train loss 0.038, col train loss 143.137


Epoch 1530: 0batch [00:00, ?batch/s]

epoch 1529: avg test  loss 1585.02, bar  test loss 3.790, len  test loss 0.039, col  test loss 143.897


Epoch 1530: 272batch [00:51,  5.28batch/s, loss=1.7e+3] 


epoch 1530: avg train loss 1574.92, bar train loss 3.782, len train loss 0.039, col train loss 142.735
epoch 1530: avg test  loss 1585.73, bar  test loss 4.165, len  test loss 0.038, col  test loss 143.974


Epoch 1531: 272batch [00:50,  5.41batch/s, loss=1.57e+3]


epoch 1531: avg train loss 1572.52, bar train loss 3.772, len train loss 0.037, col train loss 143.213


Epoch 1532: 0batch [00:00, ?batch/s]

epoch 1531: avg test  loss 1584.48, bar  test loss 4.285, len  test loss 0.045, col  test loss 144.475


Epoch 1532: 272batch [00:49,  5.48batch/s, loss=1.37e+3]


epoch 1532: avg train loss 1570.88, bar train loss 3.805, len train loss 0.039, col train loss 142.929


Epoch 1533: 0batch [00:00, ?batch/s]

epoch 1532: avg test  loss 1584.03, bar  test loss 4.148, len  test loss 0.040, col  test loss 144.082


Epoch 1533: 272batch [00:50,  5.40batch/s, loss=1.61e+3]


epoch 1533: avg train loss 1598.41, bar train loss 5.993, len train loss 0.038, col train loss 143.307


Epoch 1534: 0batch [00:00, ?batch/s]

epoch 1533: avg test  loss 1713.46, bar  test loss 16.196, len  test loss 0.038, col  test loss 143.126


Epoch 1534: 272batch [00:50,  5.34batch/s, loss=1.61e+3]


epoch 1534: avg train loss 1587.61, bar train loss 5.598, len train loss 0.037, col train loss 143.080


Epoch 1535: 0batch [00:00, ?batch/s]

epoch 1534: avg test  loss 1575.42, bar  test loss 3.752, len  test loss 0.038, col  test loss 144.210


Epoch 1535: 272batch [00:51,  5.30batch/s, loss=1.6e+3] 


epoch 1535: avg train loss 1570.55, bar train loss 3.761, len train loss 0.039, col train loss 142.565
epoch 1535: avg test  loss 1596.68, bar  test loss 5.042, len  test loss 0.041, col  test loss 143.523


Epoch 1536: 272batch [00:51,  5.29batch/s, loss=1.57e+3]


epoch 1536: avg train loss 1572.27, bar train loss 3.827, len train loss 0.037, col train loss 142.949


Epoch 1537: 0batch [00:00, ?batch/s]

epoch 1536: avg test  loss 1584.09, bar  test loss 4.154, len  test loss 0.036, col  test loss 143.536


Epoch 1537: 272batch [00:50,  5.35batch/s, loss=1.64e+3]


epoch 1537: avg train loss 1574.84, bar train loss 3.735, len train loss 0.036, col train loss 143.784


Epoch 1538: 0batch [00:00, ?batch/s]

epoch 1537: avg test  loss 1589.80, bar  test loss 4.454, len  test loss 0.037, col  test loss 144.707


Epoch 1538: 272batch [00:50,  5.34batch/s, loss=1.52e+3]


epoch 1538: avg train loss 1573.98, bar train loss 3.911, len train loss 0.036, col train loss 143.264


Epoch 1539: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1538: avg test  loss 1582.42, bar  test loss 3.795, len  test loss 0.035, col  test loss 143.946


Epoch 1539: 272batch [00:50,  5.43batch/s, loss=1.49e+3]


epoch 1539: avg train loss 1577.95, bar train loss 4.040, len train loss 0.037, col train loss 143.549


Epoch 1540: 0batch [00:00, ?batch/s]

epoch 1539: avg test  loss 1583.88, bar  test loss 4.150, len  test loss 0.035, col  test loss 144.497


Epoch 1540: 272batch [00:51,  5.27batch/s, loss=1.56e+3]


epoch 1540: avg train loss 1573.73, bar train loss 3.870, len train loss 0.036, col train loss 142.786
epoch 1540: avg test  loss 1587.20, bar  test loss 4.432, len  test loss 0.040, col  test loss 143.856


Epoch 1541: 272batch [00:51,  5.23batch/s, loss=1.61e+3]


epoch 1541: avg train loss 1566.00, bar train loss 3.684, len train loss 0.036, col train loss 142.012


Epoch 1542: 0batch [00:00, ?batch/s]

epoch 1541: avg test  loss 1578.22, bar  test loss 4.262, len  test loss 0.038, col  test loss 142.483


Epoch 1542: 272batch [00:50,  5.35batch/s, loss=1.66e+3]


epoch 1542: avg train loss 1569.48, bar train loss 3.808, len train loss 0.036, col train loss 142.571


Epoch 1543: 0batch [00:00, ?batch/s]

epoch 1542: avg test  loss 1580.18, bar  test loss 3.865, len  test loss 0.038, col  test loss 143.652


Epoch 1543: 272batch [00:50,  5.37batch/s, loss=1.48e+3]


epoch 1543: avg train loss 1571.49, bar train loss 3.778, len train loss 0.037, col train loss 142.870


Epoch 1544: 0batch [00:00, ?batch/s]

epoch 1543: avg test  loss 1582.05, bar  test loss 4.072, len  test loss 0.046, col  test loss 143.079


Epoch 1544: 272batch [00:50,  5.38batch/s, loss=1.57e+3]


epoch 1544: avg train loss 1568.47, bar train loss 3.898, len train loss 0.038, col train loss 142.493


Epoch 1545: 0batch [00:00, ?batch/s]

epoch 1544: avg test  loss 1586.95, bar  test loss 4.543, len  test loss 0.049, col  test loss 143.939


Epoch 1545: 272batch [00:51,  5.32batch/s, loss=1.58e+3]


epoch 1545: avg train loss 1569.70, bar train loss 3.892, len train loss 0.036, col train loss 142.844
epoch 1545: avg test  loss 1579.80, bar  test loss 3.918, len  test loss 0.040, col  test loss 144.815


Epoch 1546: 272batch [00:51,  5.29batch/s, loss=1.55e+3]


epoch 1546: avg train loss 1572.92, bar train loss 3.920, len train loss 0.037, col train loss 143.007


Epoch 1547: 0batch [00:00, ?batch/s]

epoch 1546: avg test  loss 1592.30, bar  test loss 5.155, len  test loss 0.036, col  test loss 144.053


Epoch 1547: 272batch [00:52,  5.21batch/s, loss=1.65e+3]


epoch 1547: avg train loss 1569.80, bar train loss 3.709, len train loss 0.037, col train loss 143.038


Epoch 1548: 0batch [00:00, ?batch/s]

epoch 1547: avg test  loss 1584.18, bar  test loss 4.123, len  test loss 0.048, col  test loss 143.334


Epoch 1548: 272batch [00:50,  5.39batch/s, loss=1.62e+3]


epoch 1548: avg train loss 1572.82, bar train loss 4.024, len train loss 0.037, col train loss 143.094


Epoch 1549: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1548: avg test  loss 1589.04, bar  test loss 4.876, len  test loss 0.039, col  test loss 143.855


Epoch 1549: 272batch [00:50,  5.38batch/s, loss=1.53e+3]


epoch 1549: avg train loss 1570.34, bar train loss 3.827, len train loss 0.036, col train loss 142.422


Epoch 1550: 0batch [00:00, ?batch/s]

epoch 1549: avg test  loss 1587.22, bar  test loss 4.106, len  test loss 0.039, col  test loss 144.174


Epoch 1550: 272batch [00:50,  5.36batch/s, loss=1.5e+3] 


epoch 1550: avg train loss 1572.58, bar train loss 3.997, len train loss 0.038, col train loss 142.907
epoch 1550: avg test  loss 1577.09, bar  test loss 3.872, len  test loss 0.040, col  test loss 144.325


Epoch 1551: 272batch [00:51,  5.30batch/s, loss=1.65e+3]


epoch 1551: avg train loss 1569.86, bar train loss 3.881, len train loss 0.038, col train loss 142.979


Epoch 1552: 0batch [00:00, ?batch/s]

epoch 1551: avg test  loss 1604.51, bar  test loss 4.674, len  test loss 0.040, col  test loss 145.320


Epoch 1552: 272batch [00:51,  5.26batch/s, loss=1.87e+3]


epoch 1552: avg train loss 1581.52, bar train loss 4.048, len train loss 0.041, col train loss 143.563


Epoch 1553: 0batch [00:00, ?batch/s]

epoch 1552: avg test  loss 1587.06, bar  test loss 4.713, len  test loss 0.045, col  test loss 143.576


Epoch 1553: 272batch [00:50,  5.35batch/s, loss=1.6e+3] 


epoch 1553: avg train loss 1578.71, bar train loss 4.149, len train loss 0.040, col train loss 143.235


Epoch 1554: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1553: avg test  loss 1586.59, bar  test loss 3.888, len  test loss 0.035, col  test loss 144.129


Epoch 1554: 272batch [00:51,  5.32batch/s, loss=1.71e+3]


epoch 1554: avg train loss 1579.32, bar train loss 3.782, len train loss 0.037, col train loss 143.704


Epoch 1555: 0batch [00:00, ?batch/s]

epoch 1554: avg test  loss 1584.47, bar  test loss 4.273, len  test loss 0.038, col  test loss 143.018


Epoch 1555: 272batch [00:51,  5.30batch/s, loss=1.66e+3]


epoch 1555: avg train loss 1567.66, bar train loss 3.838, len train loss 0.035, col train loss 142.173
epoch 1555: avg test  loss 1578.04, bar  test loss 4.127, len  test loss 0.038, col  test loss 143.244


Epoch 1556: 272batch [00:51,  5.28batch/s, loss=1.57e+3]


epoch 1556: avg train loss 1574.13, bar train loss 4.039, len train loss 0.037, col train loss 142.864


Epoch 1557: 0batch [00:00, ?batch/s]

epoch 1556: avg test  loss 1585.40, bar  test loss 3.905, len  test loss 0.042, col  test loss 143.425


Epoch 1557: 272batch [00:52,  5.20batch/s, loss=1.59e+3]


epoch 1557: avg train loss 1571.81, bar train loss 3.911, len train loss 0.038, col train loss 142.462


Epoch 1558: 0batch [00:00, ?batch/s]

epoch 1557: avg test  loss 1580.77, bar  test loss 4.272, len  test loss 0.036, col  test loss 143.084


Epoch 1558: 272batch [00:51,  5.32batch/s, loss=1.58e+3]


epoch 1558: avg train loss 1576.22, bar train loss 4.336, len train loss 0.037, col train loss 142.863


Epoch 1559: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1558: avg test  loss 1587.90, bar  test loss 4.250, len  test loss 0.039, col  test loss 144.174


Epoch 1559: 272batch [00:50,  5.36batch/s, loss=1.51e+3]


epoch 1559: avg train loss 1572.45, bar train loss 3.857, len train loss 0.035, col train loss 142.654


Epoch 1560: 0batch [00:00, ?batch/s]

epoch 1559: avg test  loss 1584.52, bar  test loss 3.791, len  test loss 0.038, col  test loss 144.589


Epoch 1560: 272batch [00:51,  5.29batch/s, loss=1.6e+3] 


epoch 1560: avg train loss 1576.58, bar train loss 3.861, len train loss 0.039, col train loss 143.384
epoch 1560: avg test  loss 1587.34, bar  test loss 3.858, len  test loss 0.034, col  test loss 143.490


Epoch 1561: 272batch [00:52,  5.16batch/s, loss=1.7e+3] 


epoch 1561: avg train loss 1574.53, bar train loss 3.739, len train loss 0.035, col train loss 143.077


Epoch 1562: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1561: avg test  loss 1579.74, bar  test loss 4.061, len  test loss 0.037, col  test loss 142.433


Epoch 1562: 272batch [00:51,  5.24batch/s, loss=1.62e+3]


epoch 1562: avg train loss 1578.77, bar train loss 3.979, len train loss 0.036, col train loss 143.063


Epoch 1563: 0batch [00:00, ?batch/s]

epoch 1562: avg test  loss 1579.03, bar  test loss 3.881, len  test loss 0.038, col  test loss 143.946


Epoch 1563: 272batch [00:50,  5.33batch/s, loss=1.7e+3] 


epoch 1563: avg train loss 1575.51, bar train loss 4.159, len train loss 0.037, col train loss 142.995


Epoch 1564: 0batch [00:00, ?batch/s, loss=1.53e+3]

epoch 1563: avg test  loss 1604.06, bar  test loss 5.562, len  test loss 0.036, col  test loss 144.193


Epoch 1564: 272batch [00:51,  5.30batch/s, loss=1.55e+3]


epoch 1564: avg train loss 1573.59, bar train loss 3.902, len train loss 0.036, col train loss 142.656


Epoch 1565: 0batch [00:00, ?batch/s, loss=1.52e+3]

epoch 1564: avg test  loss 1583.55, bar  test loss 4.040, len  test loss 0.036, col  test loss 143.033


Epoch 1565: 272batch [00:51,  5.32batch/s, loss=1.62e+3]


epoch 1565: avg train loss 1575.06, bar train loss 3.975, len train loss 0.036, col train loss 142.919
epoch 1565: avg test  loss 1581.23, bar  test loss 3.777, len  test loss 0.037, col  test loss 143.743


Epoch 1566: 272batch [00:52,  5.22batch/s, loss=1.59e+3]


epoch 1566: avg train loss 1570.06, bar train loss 3.739, len train loss 0.037, col train loss 142.888


Epoch 1567: 0batch [00:00, ?batch/s]

epoch 1566: avg test  loss 1578.50, bar  test loss 3.770, len  test loss 0.042, col  test loss 143.405


Epoch 1567: 272batch [00:52,  5.19batch/s, loss=1.67e+3]


epoch 1567: avg train loss 1572.43, bar train loss 3.910, len train loss 0.039, col train loss 143.264


Epoch 1568: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1567: avg test  loss 1602.24, bar  test loss 5.038, len  test loss 0.040, col  test loss 144.906


Epoch 1568: 272batch [00:51,  5.25batch/s, loss=1.65e+3]


epoch 1568: avg train loss 1575.25, bar train loss 4.078, len train loss 0.036, col train loss 143.359


Epoch 1569: 0batch [00:00, ?batch/s]

epoch 1568: avg test  loss 1588.31, bar  test loss 4.494, len  test loss 0.036, col  test loss 144.456


Epoch 1569: 272batch [00:51,  5.25batch/s, loss=1.57e+3]


epoch 1569: avg train loss 1575.48, bar train loss 3.797, len train loss 0.036, col train loss 143.282


Epoch 1570: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1569: avg test  loss 1607.11, bar  test loss 5.130, len  test loss 0.041, col  test loss 145.423


Epoch 1570: 272batch [00:51,  5.29batch/s, loss=1.69e+3]


epoch 1570: avg train loss 1577.80, bar train loss 3.809, len train loss 0.035, col train loss 143.144
epoch 1570: avg test  loss 1585.72, bar  test loss 3.984, len  test loss 0.038, col  test loss 144.292


Epoch 1571: 272batch [00:51,  5.27batch/s, loss=1.43e+3]


epoch 1571: avg train loss 1572.43, bar train loss 3.754, len train loss 0.036, col train loss 143.493


Epoch 1572: 0batch [00:00, ?batch/s]

epoch 1571: avg test  loss 1585.41, bar  test loss 4.235, len  test loss 0.040, col  test loss 143.770


Epoch 1572: 272batch [00:52,  5.23batch/s, loss=1.69e+3]


epoch 1572: avg train loss 1576.68, bar train loss 3.851, len train loss 0.037, col train loss 143.560


Epoch 1573: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1572: avg test  loss 1587.66, bar  test loss 4.016, len  test loss 0.043, col  test loss 144.008


Epoch 1573: 272batch [00:51,  5.26batch/s, loss=1.57e+3]


epoch 1573: avg train loss 1576.57, bar train loss 3.976, len train loss 0.038, col train loss 143.488


Epoch 1574: 0batch [00:00, ?batch/s]

epoch 1573: avg test  loss 1575.29, bar  test loss 3.764, len  test loss 0.037, col  test loss 143.416


Epoch 1574: 272batch [00:51,  5.23batch/s, loss=1.79e+3]


epoch 1574: avg train loss 1573.29, bar train loss 3.751, len train loss 0.036, col train loss 143.411


Epoch 1575: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1574: avg test  loss 1592.32, bar  test loss 4.502, len  test loss 0.036, col  test loss 143.999


Epoch 1575: 272batch [00:51,  5.26batch/s, loss=1.46e+3]


epoch 1575: avg train loss 1576.16, bar train loss 3.939, len train loss 0.037, col train loss 143.202
epoch 1575: avg test  loss 1582.95, bar  test loss 4.000, len  test loss 0.039, col  test loss 143.895


Epoch 1576: 272batch [00:51,  5.28batch/s, loss=1.59e+3]


epoch 1576: avg train loss 1578.38, bar train loss 3.880, len train loss 0.038, col train loss 143.749


Epoch 1577: 0batch [00:00, ?batch/s]

epoch 1576: avg test  loss 1597.74, bar  test loss 4.961, len  test loss 0.039, col  test loss 144.403


Epoch 1577: 272batch [00:52,  5.22batch/s, loss=1.63e+3]


epoch 1577: avg train loss 1584.28, bar train loss 3.986, len train loss 0.038, col train loss 144.233


Epoch 1578: 0batch [00:00, ?batch/s]

epoch 1577: avg test  loss 1669.73, bar  test loss 8.821, len  test loss 0.050, col  test loss 147.338


Epoch 1578: 272batch [00:52,  5.15batch/s, loss=1.57e+3]


epoch 1578: avg train loss 1581.33, bar train loss 4.168, len train loss 0.036, col train loss 143.549


Epoch 1579: 0batch [00:00, ?batch/s]

epoch 1578: avg test  loss 1587.72, bar  test loss 4.472, len  test loss 0.041, col  test loss 143.790


Epoch 1579: 272batch [00:51,  5.26batch/s, loss=1.41e+3]


epoch 1579: avg train loss 1574.21, bar train loss 3.867, len train loss 0.035, col train loss 143.257


Epoch 1580: 0batch [00:00, ?batch/s]

epoch 1579: avg test  loss 1580.47, bar  test loss 3.820, len  test loss 0.039, col  test loss 143.847


Epoch 1580: 272batch [00:51,  5.31batch/s, loss=1.69e+3]


epoch 1580: avg train loss 1572.44, bar train loss 3.767, len train loss 0.036, col train loss 143.198
epoch 1580: avg test  loss 1621.68, bar  test loss 8.291, len  test loss 0.039, col  test loss 143.374


Epoch 1581: 272batch [00:51,  5.27batch/s, loss=1.64e+3]


epoch 1581: avg train loss 1579.23, bar train loss 4.258, len train loss 0.037, col train loss 143.397


Epoch 1582: 0batch [00:00, ?batch/s, loss=1.62e+3]

epoch 1581: avg test  loss 1594.39, bar  test loss 4.449, len  test loss 0.036, col  test loss 145.217


Epoch 1582: 272batch [00:51,  5.29batch/s, loss=1.6e+3] 


epoch 1582: avg train loss 1575.53, bar train loss 3.798, len train loss 0.036, col train loss 143.274


Epoch 1583: 0batch [00:00, ?batch/s]

epoch 1582: avg test  loss 1589.42, bar  test loss 4.135, len  test loss 0.042, col  test loss 144.878


Epoch 1583: 272batch [00:52,  5.15batch/s, loss=1.46e+3]


epoch 1583: avg train loss 1582.46, bar train loss 4.126, len train loss 0.036, col train loss 143.719


Epoch 1584: 0batch [00:00, ?batch/s]

epoch 1583: avg test  loss 1590.40, bar  test loss 4.083, len  test loss 0.037, col  test loss 144.659


Epoch 1584: 272batch [00:52,  5.22batch/s, loss=1.63e+3]


epoch 1584: avg train loss 1574.47, bar train loss 3.951, len train loss 0.037, col train loss 143.357


Epoch 1585: 0batch [00:00, ?batch/s]

epoch 1584: avg test  loss 1582.80, bar  test loss 3.912, len  test loss 0.047, col  test loss 143.742


Epoch 1585: 272batch [00:52,  5.23batch/s, loss=1.44e+3]


epoch 1585: avg train loss 1576.50, bar train loss 3.887, len train loss 0.037, col train loss 143.221
epoch 1585: avg test  loss 1583.29, bar  test loss 3.853, len  test loss 0.038, col  test loss 143.427


Epoch 1586: 272batch [00:51,  5.26batch/s, loss=1.56e+3]


epoch 1586: avg train loss 1573.99, bar train loss 3.696, len train loss 0.037, col train loss 143.259


Epoch 1587: 0batch [00:00, ?batch/s]

epoch 1586: avg test  loss 1605.71, bar  test loss 5.294, len  test loss 0.039, col  test loss 144.291


Epoch 1587: 272batch [00:52,  5.20batch/s, loss=1.57e+3]


epoch 1587: avg train loss 1577.53, bar train loss 3.953, len train loss 0.039, col train loss 143.337


Epoch 1588: 0batch [00:00, ?batch/s]

epoch 1587: avg test  loss 1583.29, bar  test loss 4.164, len  test loss 0.041, col  test loss 144.300


Epoch 1588: 272batch [00:52,  5.18batch/s, loss=1.68e+3]


epoch 1588: avg train loss 1575.18, bar train loss 3.926, len train loss 0.037, col train loss 143.169


Epoch 1589: 0batch [00:00, ?batch/s]

epoch 1588: avg test  loss 1591.44, bar  test loss 4.345, len  test loss 0.038, col  test loss 145.094


Epoch 1589: 272batch [00:51,  5.23batch/s, loss=1.61e+3]


epoch 1589: avg train loss 1575.92, bar train loss 3.859, len train loss 0.035, col train loss 143.714


Epoch 1590: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1589: avg test  loss 1588.52, bar  test loss 3.930, len  test loss 0.042, col  test loss 145.399


Epoch 1590: 272batch [00:51,  5.26batch/s, loss=1.66e+3]


epoch 1590: avg train loss 1580.48, bar train loss 3.774, len train loss 0.038, col train loss 143.498
epoch 1590: avg test  loss 1595.70, bar  test loss 4.369, len  test loss 0.041, col  test loss 145.199


Epoch 1591: 272batch [00:51,  5.25batch/s, loss=1.67e+3]


epoch 1591: avg train loss 1575.10, bar train loss 4.003, len train loss 0.036, col train loss 143.523


Epoch 1592: 0batch [00:00, ?batch/s]

epoch 1591: avg test  loss 1585.85, bar  test loss 4.067, len  test loss 0.035, col  test loss 144.081


Epoch 1592: 272batch [00:52,  5.21batch/s, loss=1.6e+3] 


epoch 1592: avg train loss 1579.09, bar train loss 4.023, len train loss 0.035, col train loss 143.527


Epoch 1593: 0batch [00:00, ?batch/s]

epoch 1592: avg test  loss 1587.54, bar  test loss 3.876, len  test loss 0.038, col  test loss 144.444


Epoch 1593: 272batch [00:53,  5.10batch/s, loss=1.57e+3]


epoch 1593: avg train loss 1576.66, bar train loss 3.791, len train loss 0.035, col train loss 143.818


Epoch 1594: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1593: avg test  loss 1590.46, bar  test loss 4.135, len  test loss 0.035, col  test loss 144.906


Epoch 1594: 272batch [00:52,  5.17batch/s, loss=1.58e+3]


epoch 1594: avg train loss 1579.99, bar train loss 4.045, len train loss 0.036, col train loss 143.676


Epoch 1595: 0batch [00:00, ?batch/s]

epoch 1594: avg test  loss 1592.91, bar  test loss 4.397, len  test loss 0.037, col  test loss 143.892


Epoch 1595: 272batch [00:52,  5.17batch/s, loss=1.66e+3]


epoch 1595: avg train loss 1579.76, bar train loss 4.152, len train loss 0.035, col train loss 143.339
epoch 1595: avg test  loss 1584.49, bar  test loss 4.179, len  test loss 0.041, col  test loss 144.104


Epoch 1596: 272batch [00:52,  5.22batch/s, loss=1.67e+3]


epoch 1596: avg train loss 1578.17, bar train loss 4.043, len train loss 0.036, col train loss 143.524


Epoch 1597: 0batch [00:00, ?batch/s]

epoch 1596: avg test  loss 1588.89, bar  test loss 4.322, len  test loss 0.041, col  test loss 144.051


Epoch 1597: 272batch [00:52,  5.23batch/s, loss=1.47e+3]


epoch 1597: avg train loss 1572.62, bar train loss 3.863, len train loss 0.036, col train loss 143.128


Epoch 1598: 0batch [00:00, ?batch/s]

epoch 1597: avg test  loss 1579.96, bar  test loss 4.043, len  test loss 0.040, col  test loss 144.346


Epoch 1598: 272batch [00:52,  5.21batch/s, loss=1.55e+3]


epoch 1598: avg train loss 1581.93, bar train loss 4.377, len train loss 0.039, col train loss 143.831


Epoch 1599: 0batch [00:00, ?batch/s]

epoch 1598: avg test  loss 1647.35, bar  test loss 8.802, len  test loss 0.040, col  test loss 144.837


Epoch 1599: 272batch [00:51,  5.31batch/s, loss=1.7e+3] 


epoch 1599: avg train loss 1591.79, bar train loss 4.376, len train loss 0.038, col train loss 144.541


Epoch 1600: 0batch [00:00, ?batch/s]

epoch 1599: avg test  loss 1598.45, bar  test loss 4.536, len  test loss 0.034, col  test loss 144.710


Epoch 1600: 272batch [00:49,  5.47batch/s, loss=1.7e+3] 


epoch 1600: avg train loss 1581.13, bar train loss 3.687, len train loss 0.037, col train loss 143.702
epoch 1600: avg test  loss 1605.73, bar  test loss 4.170, len  test loss 0.051, col  test loss 146.307


Epoch 1601: 272batch [00:49,  5.45batch/s, loss=1.62e+3]


epoch 1601: avg train loss 1581.92, bar train loss 4.029, len train loss 0.041, col train loss 143.623


Epoch 1602: 0batch [00:00, ?batch/s]

epoch 1601: avg test  loss 1591.86, bar  test loss 4.422, len  test loss 0.039, col  test loss 144.219


Epoch 1602: 272batch [00:50,  5.37batch/s, loss=1.62e+3]


epoch 1602: avg train loss 1588.29, bar train loss 4.251, len train loss 0.041, col train loss 144.484


Epoch 1603: 0batch [00:00, ?batch/s]

epoch 1602: avg test  loss 1594.97, bar  test loss 4.121, len  test loss 0.037, col  test loss 144.842


Epoch 1603: 272batch [00:51,  5.33batch/s, loss=1.61e+3]


epoch 1603: avg train loss 1583.31, bar train loss 4.000, len train loss 0.037, col train loss 144.007


Epoch 1604: 0batch [00:00, ?batch/s, loss=1.63e+3]

epoch 1603: avg test  loss 1615.53, bar  test loss 5.601, len  test loss 0.043, col  test loss 147.341


Epoch 1604: 272batch [00:50,  5.38batch/s, loss=1.47e+3]


epoch 1604: avg train loss 1577.75, bar train loss 3.804, len train loss 0.036, col train loss 143.897


Epoch 1605: 0batch [00:00, ?batch/s]

epoch 1604: avg test  loss 1586.96, bar  test loss 3.990, len  test loss 0.035, col  test loss 144.256


Epoch 1605: 272batch [00:50,  5.36batch/s, loss=1.45e+3]


epoch 1605: avg train loss 1576.60, bar train loss 3.924, len train loss 0.036, col train loss 143.405
epoch 1605: avg test  loss 1590.76, bar  test loss 4.052, len  test loss 0.041, col  test loss 145.653


Epoch 1606: 272batch [00:49,  5.44batch/s, loss=1.52e+3]


epoch 1606: avg train loss 1577.53, bar train loss 3.823, len train loss 0.038, col train loss 143.422


Epoch 1607: 0batch [00:00, ?batch/s, loss=1.5e+3]

epoch 1606: avg test  loss 1591.41, bar  test loss 4.061, len  test loss 0.039, col  test loss 145.013


Epoch 1607: 272batch [00:49,  5.44batch/s, loss=1.61e+3]


epoch 1607: avg train loss 1582.15, bar train loss 4.067, len train loss 0.038, col train loss 143.752


Epoch 1608: 0batch [00:00, ?batch/s, loss=1.54e+3]

epoch 1607: avg test  loss 1585.70, bar  test loss 3.817, len  test loss 0.042, col  test loss 144.683


Epoch 1608: 272batch [00:50,  5.42batch/s, loss=1.67e+3]


epoch 1608: avg train loss 1575.44, bar train loss 3.995, len train loss 0.036, col train loss 143.034


Epoch 1609: 0batch [00:00, ?batch/s]

epoch 1608: avg test  loss 1596.34, bar  test loss 4.138, len  test loss 0.040, col  test loss 145.984


Epoch 1609: 272batch [00:50,  5.42batch/s, loss=1.54e+3]


epoch 1609: avg train loss 1577.38, bar train loss 4.033, len train loss 0.037, col train loss 143.491


Epoch 1610: 0batch [00:00, ?batch/s]

epoch 1609: avg test  loss 1582.80, bar  test loss 4.038, len  test loss 0.039, col  test loss 144.228


Epoch 1610: 272batch [00:50,  5.36batch/s, loss=1.68e+3]


epoch 1610: avg train loss 1575.79, bar train loss 3.919, len train loss 0.035, col train loss 143.361
epoch 1610: avg test  loss 1597.48, bar  test loss 5.546, len  test loss 0.035, col  test loss 144.134


Epoch 1611: 272batch [00:50,  5.38batch/s, loss=1.72e+3]


epoch 1611: avg train loss 1576.96, bar train loss 3.945, len train loss 0.035, col train loss 143.442


Epoch 1612: 0batch [00:00, ?batch/s]

epoch 1611: avg test  loss 1603.20, bar  test loss 5.131, len  test loss 0.034, col  test loss 145.304


Epoch 1612: 272batch [00:49,  5.44batch/s, loss=1.55e+3]


epoch 1612: avg train loss 1576.83, bar train loss 3.954, len train loss 0.035, col train loss 143.506


Epoch 1613: 0batch [00:00, ?batch/s]

epoch 1612: avg test  loss 1596.33, bar  test loss 4.325, len  test loss 0.036, col  test loss 144.503


Epoch 1613: 272batch [00:50,  5.43batch/s, loss=1.63e+3]


epoch 1613: avg train loss 1576.99, bar train loss 3.866, len train loss 0.037, col train loss 143.102


Epoch 1614: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1613: avg test  loss 1582.65, bar  test loss 3.691, len  test loss 0.037, col  test loss 143.239


Epoch 1614: 272batch [00:49,  5.46batch/s, loss=1.69e+3]


epoch 1614: avg train loss 1578.43, bar train loss 3.878, len train loss 0.038, col train loss 143.413


Epoch 1615: 0batch [00:00, ?batch/s]

epoch 1614: avg test  loss 1595.47, bar  test loss 4.166, len  test loss 0.037, col  test loss 145.251


Epoch 1615: 272batch [00:50,  5.37batch/s, loss=1.7e+3] 


epoch 1615: avg train loss 1580.94, bar train loss 3.798, len train loss 0.035, col train loss 144.455
epoch 1615: avg test  loss 1583.65, bar  test loss 4.007, len  test loss 0.039, col  test loss 144.767


Epoch 1616: 272batch [00:50,  5.34batch/s, loss=1.63e+3]


epoch 1616: avg train loss 1575.74, bar train loss 3.952, len train loss 0.037, col train loss 143.581


Epoch 1617: 0batch [00:00, ?batch/s, loss=1.57e+3]

epoch 1616: avg test  loss 1587.47, bar  test loss 4.423, len  test loss 0.038, col  test loss 144.506


Epoch 1617: 272batch [00:50,  5.36batch/s, loss=1.61e+3]


epoch 1617: avg train loss 1578.86, bar train loss 4.018, len train loss 0.038, col train loss 143.361


Epoch 1618: 0batch [00:00, ?batch/s]

epoch 1617: avg test  loss 1589.02, bar  test loss 4.072, len  test loss 0.037, col  test loss 144.506


Epoch 1618: 272batch [00:49,  5.45batch/s, loss=1.64e+3]


epoch 1618: avg train loss 1583.03, bar train loss 3.977, len train loss 0.037, col train loss 143.776


Epoch 1619: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1618: avg test  loss 1600.94, bar  test loss 4.506, len  test loss 0.044, col  test loss 145.356


Epoch 1619: 272batch [00:51,  5.30batch/s, loss=1.45e+3]


epoch 1619: avg train loss 1581.24, bar train loss 3.814, len train loss 0.037, col train loss 144.013


Epoch 1620: 0batch [00:00, ?batch/s]

epoch 1619: avg test  loss 1589.99, bar  test loss 4.479, len  test loss 0.041, col  test loss 144.417


Epoch 1620: 272batch [00:50,  5.40batch/s, loss=1.6e+3] 


epoch 1620: avg train loss 1573.47, bar train loss 3.842, len train loss 0.035, col train loss 142.688
epoch 1620: avg test  loss 1601.56, bar  test loss 5.208, len  test loss 0.040, col  test loss 144.697


Epoch 1621: 272batch [00:50,  5.36batch/s, loss=1.72e+3]


epoch 1621: avg train loss 1585.01, bar train loss 4.159, len train loss 0.037, col train loss 144.108


Epoch 1622: 0batch [00:00, ?batch/s]

epoch 1621: avg test  loss 1597.12, bar  test loss 4.608, len  test loss 0.044, col  test loss 144.441


Epoch 1622: 272batch [00:51,  5.32batch/s, loss=1.71e+3]


epoch 1622: avg train loss 1585.39, bar train loss 4.206, len train loss 0.040, col train loss 143.888


Epoch 1623: 0batch [00:00, ?batch/s]

epoch 1622: avg test  loss 1650.81, bar  test loss 9.995, len  test loss 0.040, col  test loss 144.133


Epoch 1623: 272batch [00:50,  5.37batch/s, loss=1.47e+3]


epoch 1623: avg train loss 1580.75, bar train loss 4.056, len train loss 0.037, col train loss 143.864


Epoch 1624: 0batch [00:00, ?batch/s]

epoch 1623: avg test  loss 1587.77, bar  test loss 4.134, len  test loss 0.035, col  test loss 144.299


Epoch 1624: 272batch [00:50,  5.37batch/s, loss=1.6e+3] 


epoch 1624: avg train loss 1579.95, bar train loss 4.015, len train loss 0.036, col train loss 143.705


Epoch 1625: 0batch [00:00, ?batch/s]

epoch 1624: avg test  loss 1601.02, bar  test loss 4.024, len  test loss 0.038, col  test loss 143.612


Epoch 1625: 272batch [00:50,  5.38batch/s, loss=1.54e+3]


epoch 1625: avg train loss 1585.06, bar train loss 4.457, len train loss 0.037, col train loss 143.431
epoch 1625: avg test  loss 1610.12, bar  test loss 5.769, len  test loss 0.035, col  test loss 144.817


Epoch 1626: 272batch [00:50,  5.43batch/s, loss=1.78e+3]


epoch 1626: avg train loss 1583.73, bar train loss 4.000, len train loss 0.036, col train loss 144.299


Epoch 1627: 0batch [00:00, ?batch/s]

epoch 1626: avg test  loss 1598.21, bar  test loss 4.085, len  test loss 0.044, col  test loss 145.148


Epoch 1627: 272batch [00:50,  5.35batch/s, loss=1.59e+3]


epoch 1627: avg train loss 1582.58, bar train loss 3.950, len train loss 0.037, col train loss 144.068


Epoch 1628: 0batch [00:00, ?batch/s]

epoch 1627: avg test  loss 1586.24, bar  test loss 3.917, len  test loss 0.037, col  test loss 144.918


Epoch 1628: 272batch [00:51,  5.31batch/s, loss=1.49e+3]


epoch 1628: avg train loss 1585.66, bar train loss 4.131, len train loss 0.040, col train loss 144.284


Epoch 1629: 0batch [00:00, ?batch/s]

epoch 1628: avg test  loss 1590.82, bar  test loss 3.977, len  test loss 0.040, col  test loss 144.734


Epoch 1629: 272batch [00:50,  5.37batch/s, loss=1.48e+3]


epoch 1629: avg train loss 1581.72, bar train loss 4.116, len train loss 0.037, col train loss 143.493


Epoch 1630: 0batch [00:00, ?batch/s, loss=1.56e+3]

epoch 1629: avg test  loss 1593.44, bar  test loss 4.602, len  test loss 0.035, col  test loss 144.520


Epoch 1630: 272batch [00:50,  5.36batch/s, loss=1.69e+3]


epoch 1630: avg train loss 1580.05, bar train loss 3.827, len train loss 0.037, col train loss 144.134
epoch 1630: avg test  loss 1590.37, bar  test loss 3.772, len  test loss 0.040, col  test loss 145.739


Epoch 1631: 272batch [00:50,  5.41batch/s, loss=1.68e+3]


epoch 1631: avg train loss 1582.75, bar train loss 3.929, len train loss 0.040, col train loss 144.123


Epoch 1632: 0batch [00:00, ?batch/s]

epoch 1631: avg test  loss 1590.95, bar  test loss 3.799, len  test loss 0.039, col  test loss 143.943


Epoch 1632: 272batch [00:50,  5.38batch/s, loss=1.8e+3] 


epoch 1632: avg train loss 1582.61, bar train loss 3.794, len train loss 0.037, col train loss 144.205


Epoch 1633: 0batch [00:00, ?batch/s]

epoch 1632: avg test  loss 1590.84, bar  test loss 4.045, len  test loss 0.036, col  test loss 145.745


Epoch 1633: 272batch [00:50,  5.36batch/s, loss=1.61e+3]


epoch 1633: avg train loss 1593.29, bar train loss 4.307, len train loss 0.050, col train loss 144.698


Epoch 1634: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1633: avg test  loss 1591.91, bar  test loss 4.121, len  test loss 0.040, col  test loss 144.770


Epoch 1634: 272batch [00:51,  5.31batch/s, loss=1.72e+3]


epoch 1634: avg train loss 1587.23, bar train loss 3.965, len train loss 0.036, col train loss 144.605


Epoch 1635: 0batch [00:00, ?batch/s]

epoch 1634: avg test  loss 1611.55, bar  test loss 4.600, len  test loss 0.041, col  test loss 146.561


Epoch 1635: 272batch [00:50,  5.42batch/s, loss=1.56e+3]


epoch 1635: avg train loss 1584.50, bar train loss 3.984, len train loss 0.039, col train loss 144.253
epoch 1635: avg test  loss 1592.13, bar  test loss 4.299, len  test loss 0.038, col  test loss 145.460


Epoch 1636: 272batch [00:50,  5.34batch/s, loss=1.52e+3]


epoch 1636: avg train loss 1588.19, bar train loss 4.287, len train loss 0.037, col train loss 144.161


Epoch 1637: 0batch [00:00, ?batch/s, loss=1.55e+3]

epoch 1636: avg test  loss 1600.14, bar  test loss 4.218, len  test loss 0.037, col  test loss 145.303


Epoch 1637: 272batch [00:51,  5.30batch/s, loss=1.59e+3]


epoch 1637: avg train loss 1581.63, bar train loss 3.767, len train loss 0.035, col train loss 143.853


Epoch 1638: 0batch [00:00, ?batch/s]

epoch 1637: avg test  loss 1594.02, bar  test loss 3.856, len  test loss 0.036, col  test loss 144.134


Epoch 1638: 272batch [00:51,  5.26batch/s, loss=1.6e+3] 


epoch 1638: avg train loss 1587.20, bar train loss 3.966, len train loss 0.040, col train loss 144.269


Epoch 1639: 0batch [00:00, ?batch/s]

epoch 1638: avg test  loss 1587.90, bar  test loss 3.985, len  test loss 0.042, col  test loss 145.025


Epoch 1639: 272batch [00:50,  5.37batch/s, loss=1.52e+3]


epoch 1639: avg train loss 1582.39, bar train loss 3.986, len train loss 0.036, col train loss 143.815


Epoch 1640: 0batch [00:00, ?batch/s]

epoch 1639: avg test  loss 1593.82, bar  test loss 4.119, len  test loss 0.037, col  test loss 144.869


Epoch 1640: 272batch [00:51,  5.32batch/s, loss=1.54e+3]


epoch 1640: avg train loss 1581.57, bar train loss 3.841, len train loss 0.036, col train loss 144.213
epoch 1640: avg test  loss 1592.12, bar  test loss 4.009, len  test loss 0.040, col  test loss 144.908


Epoch 1641: 272batch [00:50,  5.38batch/s, loss=1.59e+3]


epoch 1641: avg train loss 1586.88, bar train loss 4.434, len train loss 0.037, col train loss 143.600


Epoch 1642: 0batch [00:00, ?batch/s]

epoch 1641: avg test  loss 1606.91, bar  test loss 4.127, len  test loss 0.044, col  test loss 146.872


Epoch 1642: 272batch [00:50,  5.34batch/s, loss=1.46e+3]


epoch 1642: avg train loss 1581.09, bar train loss 3.857, len train loss 0.036, col train loss 144.131


Epoch 1643: 0batch [00:00, ?batch/s, loss=1.6e+3]

epoch 1642: avg test  loss 1585.27, bar  test loss 3.889, len  test loss 0.038, col  test loss 144.906


Epoch 1643: 272batch [00:50,  5.34batch/s, loss=1.61e+3]


epoch 1643: avg train loss 1578.22, bar train loss 3.878, len train loss 0.036, col train loss 143.611


Epoch 1644: 0batch [00:00, ?batch/s]

epoch 1643: avg test  loss 1585.95, bar  test loss 4.078, len  test loss 0.039, col  test loss 144.753


Epoch 1644: 272batch [00:51,  5.28batch/s, loss=1.61e+3]


epoch 1644: avg train loss 1579.87, bar train loss 3.907, len train loss 0.038, col train loss 143.918


Epoch 1645: 0batch [00:00, ?batch/s]

epoch 1644: avg test  loss 1588.43, bar  test loss 4.163, len  test loss 0.036, col  test loss 144.118


Epoch 1645: 272batch [00:51,  5.32batch/s, loss=1.67e+3]


epoch 1645: avg train loss 1582.91, bar train loss 3.920, len train loss 0.035, col train loss 144.183
epoch 1645: avg test  loss 1620.70, bar  test loss 6.658, len  test loss 0.043, col  test loss 144.757


Epoch 1646: 272batch [00:50,  5.36batch/s, loss=1.55e+3]


epoch 1646: avg train loss 1580.54, bar train loss 3.935, len train loss 0.038, col train loss 143.590


Epoch 1647: 0batch [00:00, ?batch/s]

epoch 1646: avg test  loss 1598.26, bar  test loss 4.267, len  test loss 0.045, col  test loss 145.527


Epoch 1647: 272batch [00:50,  5.35batch/s, loss=1.44e+3]


epoch 1647: avg train loss 1579.04, bar train loss 3.837, len train loss 0.035, col train loss 143.901


Epoch 1648: 0batch [00:00, ?batch/s]

epoch 1647: avg test  loss 1605.08, bar  test loss 4.150, len  test loss 0.040, col  test loss 146.118


Epoch 1648: 272batch [00:50,  5.34batch/s, loss=1.51e+3]


epoch 1648: avg train loss 1583.84, bar train loss 4.075, len train loss 0.037, col train loss 144.325


Epoch 1649: 0batch [00:00, ?batch/s]

epoch 1648: avg test  loss 1600.95, bar  test loss 4.992, len  test loss 0.038, col  test loss 144.950


Epoch 1649: 272batch [00:51,  5.32batch/s, loss=1.68e+3]


epoch 1649: avg train loss 1580.90, bar train loss 3.903, len train loss 0.036, col train loss 144.246


Epoch 1650: 0batch [00:00, ?batch/s]

epoch 1649: avg test  loss 1593.53, bar  test loss 4.548, len  test loss 0.038, col  test loss 145.661


Epoch 1650: 272batch [00:51,  5.28batch/s, loss=1.52e+3]


epoch 1650: avg train loss 1588.89, bar train loss 4.101, len train loss 0.036, col train loss 144.555
epoch 1650: avg test  loss 1600.18, bar  test loss 4.726, len  test loss 0.040, col  test loss 144.614


Epoch 1651: 272batch [00:50,  5.34batch/s, loss=1.63e+3]


epoch 1651: avg train loss 1584.40, bar train loss 3.908, len train loss 0.039, col train loss 144.344


Epoch 1652: 0batch [00:00, ?batch/s]

epoch 1651: avg test  loss 1591.16, bar  test loss 3.954, len  test loss 0.039, col  test loss 145.471


Epoch 1652: 272batch [00:51,  5.31batch/s, loss=1.59e+3]


epoch 1652: avg train loss 1588.11, bar train loss 3.912, len train loss 0.041, col train loss 144.764


Epoch 1653: 0batch [00:00, ?batch/s]

epoch 1652: avg test  loss 1598.42, bar  test loss 3.948, len  test loss 0.046, col  test loss 145.744


Epoch 1653: 272batch [00:51,  5.31batch/s, loss=1.43e+3]


epoch 1653: avg train loss 1584.87, bar train loss 3.929, len train loss 0.038, col train loss 144.276


Epoch 1654: 0batch [00:00, ?batch/s]

epoch 1653: avg test  loss 1587.98, bar  test loss 3.861, len  test loss 0.038, col  test loss 145.119


Epoch 1654: 272batch [00:51,  5.30batch/s, loss=1.65e+3]


epoch 1654: avg train loss 1579.02, bar train loss 3.860, len train loss 0.036, col train loss 143.345


Epoch 1655: 0batch [00:00, ?batch/s]

epoch 1654: avg test  loss 1590.42, bar  test loss 4.278, len  test loss 0.036, col  test loss 143.798


Epoch 1655: 272batch [00:52,  5.22batch/s, loss=1.49e+3]


epoch 1655: avg train loss 1584.12, bar train loss 4.093, len train loss 0.038, col train loss 144.319
epoch 1655: avg test  loss 1595.99, bar  test loss 4.116, len  test loss 0.041, col  test loss 145.052


Epoch 1656: 272batch [00:52,  5.15batch/s, loss=1.44e+3]


epoch 1656: avg train loss 1579.53, bar train loss 3.845, len train loss 0.036, col train loss 143.660


Epoch 1657: 0batch [00:00, ?batch/s]

epoch 1656: avg test  loss 1739.49, bar  test loss 17.449, len  test loss 0.053, col  test loss 146.521


Epoch 1657: 272batch [00:51,  5.29batch/s, loss=1.58e+3]


epoch 1657: avg train loss 1598.34, bar train loss 5.140, len train loss 0.039, col train loss 144.785


Epoch 1658: 0batch [00:00, ?batch/s]

epoch 1657: avg test  loss 1604.92, bar  test loss 4.241, len  test loss 0.042, col  test loss 146.414


Epoch 1658: 272batch [00:51,  5.31batch/s, loss=1.52e+3]


epoch 1658: avg train loss 1583.07, bar train loss 3.815, len train loss 0.036, col train loss 144.411


Epoch 1659: 0batch [00:00, ?batch/s, loss=1.58e+3]

epoch 1658: avg test  loss 1598.11, bar  test loss 3.997, len  test loss 0.038, col  test loss 146.267


Epoch 1659: 272batch [00:51,  5.32batch/s, loss=1.65e+3]


epoch 1659: avg train loss 1586.69, bar train loss 4.009, len train loss 0.037, col train loss 144.777


Epoch 1660: 0batch [00:00, ?batch/s]

epoch 1659: avg test  loss 1598.83, bar  test loss 4.302, len  test loss 0.037, col  test loss 145.984


Epoch 1660: 272batch [00:50,  5.34batch/s, loss=1.64e+3]


epoch 1660: avg train loss 1585.17, bar train loss 3.955, len train loss 0.038, col train loss 144.487
epoch 1660: avg test  loss 1594.82, bar  test loss 3.941, len  test loss 0.038, col  test loss 145.580


Epoch 1661: 272batch [00:51,  5.25batch/s, loss=1.64e+3]


epoch 1661: avg train loss 1582.50, bar train loss 3.812, len train loss 0.036, col train loss 143.959


Epoch 1662: 0batch [00:00, ?batch/s]

epoch 1661: avg test  loss 1601.69, bar  test loss 4.746, len  test loss 0.036, col  test loss 145.471


Epoch 1662: 272batch [00:51,  5.25batch/s, loss=1.53e+3]


epoch 1662: avg train loss 1591.30, bar train loss 4.116, len train loss 0.040, col train loss 144.948


Epoch 1663: 0batch [00:00, ?batch/s]

epoch 1662: avg test  loss 1606.38, bar  test loss 4.478, len  test loss 0.038, col  test loss 144.597


Epoch 1663: 272batch [00:51,  5.28batch/s, loss=1.56e+3]


epoch 1663: avg train loss 1586.85, bar train loss 3.951, len train loss 0.035, col train loss 144.374


RuntimeError: [enforce fail at C:\actions-runner\_work\pytorch\pytorch\builder\windows\pytorch\c10\core\impl\alloc_cpu.cpp:81] data. DefaultCPUAllocator: not enough memory: you tried to allocate 7680000 bytes.

In [None]:
lss2, lss_t2 = train(default_args, train_loader, test_loader, diva, optimizer, 3500, 2000, save_folder="VAE10")

In [None]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 5600, 2200, save_folder="VAE4")

In [None]:
def plot_loss_acc(lss, lss_t):
    fig,ax = plt.subplots()
    ax.plot(lss, label="train loss")
    ax.plot(lss_t, label = "test loss")
    #ax1 = ax.twinx()
    #ax1.plot(yacc, label = "train accuracy", ls='--')
    #ax1.plot(yacc_t, label = "test accuracy", ls='--')

    lines, labels = ax.get_legend_handles_labels()
    #lines2, labels2 = ax1.get_legend_handles_labels()

    ax.legend(lines, labels)

In [None]:
plot_loss_acc(lss, lss_t)

In [None]:
plot_loss_acc(lss3, lss_t3, yacc3, yacc_t3)

In [None]:
def plot_change_latent_var(diva, lat_space="y", var_idx=[0,1,2,3,4,5,6,7], step = 5):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:len(var_idx)].to(DEVICE).float()
        x = a[1][0][:len(var_idx)].to(DEVICE).float()
        y = a[1][1][:len(var_idx)].to(DEVICE).float()

        zx, zx_sc = diva.qzx(x)
        zy, zy_sc = diva.qzy(x)
        zd, zd_sc =  diva.qzd(x)

        print(torch.max(zy), torch.min(zy), "sdmax:", torch.max(zy_sc))

        out = change(zx, zy, zd, var_idx, lat_space, diva, step)
    
    fig, ax = plt.subplots(ncols=out.shape[0],nrows=len(var_idx),figsize=(10*4*out.shape[0],10*len(var_idx)))
    for i in range(out.shape[0]):
      for j in range(len(var_idx)):
        ax[j,i].imshow(out[i,j])

In [None]:
def change(zx, zy, zd, idx, lat = "y", model=diva, step = 2):
    
    dif = np.arange(-30,15,step)
    print(torch.max(zy), torch.min(zy))
    out = np.zeros((dif.shape[0], len(idx), 25, 100 ,3))  
    #print(zy.shape, dif.shape[0])
    for i in range(dif.shape[0]):
      for j in range(len(idx)):
        if lat == "y":
            zy[j,idx] = dif[i]
        elif lat == "x":
            zx[j,idx] = dif[i]
        elif lat == "d":
            zd[j,idx] = dif[i]
        len_, bar, col = model.px(zd[j],zx[j],zy[j])
        out[i,j] = model.px.reconstruct_image(len_[None,:], bar, col)
    
    return out



In [None]:
plot_change_latent_var(diva)

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss2], label="train loss")
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss_t2], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(50,120), yacc2, label = "train")
ax1.plot(np.arange(50,120), yacc_t2, label = "test")

plt.legend()

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss3], label="train loss")
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss_t3], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(120,180), yacc3, label = "train",c='green')
ax1.plot(np.arange(120,180), yacc_t3, label = "test")

plt.legend()

# Model Evaluation

## Sampling from trained model

In [None]:
def plot_latent_space(lat_space="y"):
    '''
    lat_space: y, d, x
    '''

    

In [None]:
plot(x, out, 0)

In [None]:
fig, ax = plt.subplots(nrows=3, ncols=3)
for i in range(9):
  ax[i//3, i%3].imshow(x[i].cpu().permute(1,2,0))
  
plt.savefig('divastamporg.png')