In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader, Dataset
import copy
import numpy as np
import matplotlib.pyplot as plt
from tqdm import tqdm
import networkx as nx
from torch.nn.utils import parameters_to_vector, vector_to_parameters

In [2]:
# Graph implementation
def generate_graph(cluster_sizes=[100,100], pin=0.5, pout=0.01, seed=0):
    """Generate a random connected graph"""
    probs = np.array([[pin, pout],[pout, pin]])
    while True:
        g = nx.stochastic_block_model(cluster_sizes, probs)
        if nx.algorithms.components.is_connected(g):
            return g


cluster_sizes = [10, 10]
pin = 0.5
pout = 0.01
seed = 0
alpha = 1e-3
lamda = 1e-1
eta = 1e-3
no_users = sum(cluster_sizes)
batch_size = 20
epochs = 1
it = 2000
G = generate_graph(cluster_sizes, pin, pout, seed)

#nx.draw(G, with_labels=True, node_size=100, alpha=1, linewidths=10)
#plt.show()

In [3]:
# Metropolis weights 
number_nodes = G.number_of_nodes()
weights = np.zeros([number_nodes, number_nodes])
for edge in G.edges():
  i, j = edge[0], edge[1]
  weights[i - 1][j - 1] = 1 / (1 + np.max([G.degree(i), G.degree(j)]))
  weights[j - 1][i - 1] = weights[i - 1][j - 1]

print(weights)

weights = weights + np.diag(1 - np.sum(weights, axis=0))

metropolis_weights = weights
print(metropolis_weights)


[[0.         0.         0.         0.         0.16666667 0.
  0.2        0.14285714 0.         0.         0.         0.
  0.         0.         0.         0.         0.         0.
  0.         0.11111111]
 [0.         0.         0.16666667 0.         0.         0.2
  0.         0.         0.125      0.         0.         0.
  0.         0.         0.         0.         0.         0.
  0.         0.11111111]
 [0.         0.16666667 0.         0.         0.16666667 0.
  0.         0.14285714 0.125      0.         0.         0.
  0.         0.         0.         0.         0.         0.
  0.         0.11111111]
 [0.         0.         0.         0.         0.16666667 0.
  0.         0.14285714 0.         0.         0.         0.
  0.         0.         0.         0.         0.         0.
  0.         0.11111111]
 [0.16666667 0.         0.16666667 0.16666667 0.         0.
  0.         0.14285714 0.         0.         0.         0.
  0.         0.         0.         0.         0.         0.

In [4]:
def load_dataset():
    transforms_mnist = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.1307,),(0.3081,))])
    mnist_data_train = datasets.MNIST('./data/mnist', train=True, download=True, transform=transforms_mnist)
    mnist_data_test = datasets.MNIST('./data/mnist', train=False, download=True, transform=transforms_mnist)

    return mnist_data_train, mnist_data_test

In [5]:
def degrees(A):
    """Return the degrees of each node of a graph from its adjacency matrix"""
    return np.sum(A, axis=0).reshape(A.shape[0], 1)

def node_degree(n, G):
    cnt = 0
    for i in G.neighbors(n):
        cnt += 1
    return cnt

def get_neighbors(n, G):
    neighbors_list = []
    for i in G.neighbors(n):
        neighbors_list.append(int(i))
    return neighbors_list

In [6]:
datapoints = {}
count = 0
W1 = np.array([2.0, 2.0])
W2 = np.array([-2.0, 2.0])
W = [W1, W2]
m = 200
n = 2
noise_sd = 0.001
for i, cluster_size in enumerate(cluster_sizes):
    for j in range(cluster_size):
        features = np.random.normal(loc=0.0, scale=1.0, size=(m, n))
        label = np.dot(features, W[i]) + np.random.normal(0,noise_sd)
        datapoints[count] = {
                'features': features,
                'degree': node_degree(count, G),
                'label': label,
                'neighbors': get_neighbors(count, G),
                'exact_weights': torch.from_numpy(W[i])
            }
        count += 1

In [7]:
class MyDataset(Dataset):
    def __init__(self, data, targets, transform=None):
        self.data = torch.FloatTensor(data)
        self.targets = torch.FloatTensor(targets).unsqueeze(-1)
        
    def __getitem__(self, index):
        x = self.data[index]
        y = self.targets[index]

        return x, y
    
    def __len__(self):
        return len(self.data)


In [8]:
class MLP_Net(nn.Module):
    def __init__(self, user_id):
        super(MLP_Net, self).__init__()
        self.fc1 = nn.Linear(2, 1, bias=False)
        #self.fc2 = nn.Linear(4, 1, bias=False)
        #self.fc3 = nn.Linear(200, 10)
        self.user_id = user_id

    def forward(self, x):
        x = torch.flatten(x, 1)
        #x = F.relu(self.fc1(x))
        output = self.fc1(x)
        #output = self.fc3(x)
        return output

In [9]:
from typing import Iterable, Optional

def grads_to_vector(parameters: Iterable[torch.Tensor]) -> torch.Tensor:
    r"""Convert parameters to one vector

    Args:
        parameters (Iterable[Tensor]): an iterator of Tensors that are the
            parameters of a model.

    Returns:
        The parameters represented by a single vector
    """
    # Flag for the device where the parameter is located
    param_device = None

    vec = []
    for param in parameters:
        # Ensure the parameters are located in the same device
        param_device = param.grad

        vec.append(param_device.view(-1))
    return torch.cat(vec)

In [10]:
model = MLP_Net(user_id=0)

lr = 0.01

dataloader = DataLoader(MyDataset(datapoints[19]["features"], datapoints[19]["label"]), batch_size=50, shuffle=False)
optimizer = torch.optim.SGD(model.parameters(), lr=0.01)
for i in range(100):
    for (x, y) in dataloader:
        criterion = nn.MSELoss()
        optimizer.zero_grad()
        yhat = model(x)
        print(y.size())
        print(yhat.size())
        loss = criterion(yhat, y)
        
        loss.backward()
        print(i, loss, grads_to_vector(model.parameters()), parameters_to_vector(model.parameters()))
        #optimizer.step()
        new_model = parameters_to_vector(model.parameters()) - lr * grads_to_vector(model.parameters())
        vector_to_parameters(parameters=model.parameters(), vec=new_model)
        #if i % 50 ==0:
            #lr *= 0.9
            

#parameters_to_vector(model.parameters())

torch.Size([50, 1])
torch.Size([50, 1])
0 tensor(10.0853, grad_fn=<MseLossBackward0>) tensor([ 4.2892, -4.2840]) tensor([ 0.5111, -0.1943], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
0 tensor(12.2048, grad_fn=<MseLossBackward0>) tensor([ 6.5189, -3.8671]) tensor([ 0.4682, -0.1514], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
0 tensor(7.2678, grad_fn=<MseLossBackward0>) tensor([ 3.8602, -2.4888]) tensor([ 0.4030, -0.1128], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
0 tensor(7.3562, grad_fn=<MseLossBackward0>) tensor([ 3.9552, -2.5681]) tensor([ 0.3644, -0.0879], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
1 tensor(8.7673, grad_fn=<MseLossBackward0>) tensor([ 3.9711, -4.0262]) tensor([ 0.3248, -0.0622], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
1 tensor(10.5703, grad_fn=<MseLossBackward0>) tensor([ 6.0182, -3.6542]) tensor([ 0.2851, -0.0219], grad_fn=<CatBackward0>)
torch.Size([50, 1])

16 tensor(0.7603, grad_fn=<MseLossBackward0>) tensor([ 1.0774, -0.9806]) tensor([-1.2881,  1.2319], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
16 tensor(0.7637, grad_fn=<MseLossBackward0>) tensor([ 1.1831, -0.9208]) tensor([-1.2989,  1.2417], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
17 tensor(0.9535, grad_fn=<MseLossBackward0>) tensor([ 1.1770, -1.4629]) tensor([-1.3107,  1.2509], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
17 tensor(1.0978, grad_fn=<MseLossBackward0>) tensor([ 1.7066, -1.4152]) tensor([-1.3225,  1.2655], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
17 tensor(0.6615, grad_fn=<MseLossBackward0>) tensor([ 0.9959, -0.9229]) tensor([-1.3396,  1.2797], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
17 tensor(0.6638, grad_fn=<MseLossBackward0>) tensor([ 1.0982, -0.8629]) tensor([-1.3495,  1.2889], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
18 tensor(0.8310

30 tensor(0.1086, grad_fn=<MseLossBackward0>) tensor([ 0.4212, -0.3687]) tensor([-1.7520,  1.6941], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
31 tensor(0.1399, grad_fn=<MseLossBackward0>) tensor([ 0.4162, -0.5903]) tensor([-1.7562,  1.6978], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
31 tensor(0.1572, grad_fn=<MseLossBackward0>) tensor([ 0.5826, -0.5903]) tensor([-1.7604,  1.7037], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
31 tensor(0.0956, grad_fn=<MseLossBackward0>) tensor([ 0.3362, -0.3874]) tensor([-1.7662,  1.7096], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
31 tensor(0.0945, grad_fn=<MseLossBackward0>) tensor([ 0.3915, -0.3452]) tensor([-1.7696,  1.7134], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
32 tensor(0.1220, grad_fn=<MseLossBackward0>) tensor([ 0.3867, -0.5529]) tensor([-1.7735,  1.7169], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
32 tensor(0.1370

45 tensor(0.0207, grad_fn=<MseLossBackward0>) tensor([ 0.1500, -0.2351]) tensor([-1.9121,  1.8796], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
45 tensor(0.0230, grad_fn=<MseLossBackward0>) tensor([ 0.2038, -0.2402]) tensor([-1.9136,  1.8820], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
45 tensor(0.0141, grad_fn=<MseLossBackward0>) tensor([ 0.1165, -0.1585]) tensor([-1.9156,  1.8844], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
45 tensor(0.0137, grad_fn=<MseLossBackward0>) tensor([ 0.1421, -0.1366]) tensor([-1.9168,  1.8860], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
46 tensor(0.0181, grad_fn=<MseLossBackward0>) tensor([ 0.1395, -0.2200]) tensor([-1.9182,  1.8873], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
46 tensor(0.0200, grad_fn=<MseLossBackward0>) tensor([ 0.1892, -0.2251]) tensor([-1.9196,  1.8895], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
46 tensor(0.0123

67 tensor(0.0011, grad_fn=<MseLossBackward0>) tensor([ 0.0408, -0.0567]) tensor([-1.9821,  1.9727], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
67 tensor(0.0007, grad_fn=<MseLossBackward0>) tensor([ 0.0232, -0.0378]) tensor([-1.9825,  1.9732], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
67 tensor(0.0007, grad_fn=<MseLossBackward0>) tensor([ 0.0296, -0.0312]) tensor([-1.9827,  1.9736], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
68 tensor(0.0009, grad_fn=<MseLossBackward0>) tensor([ 0.0289, -0.0509]) tensor([-1.9830,  1.9739], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
68 tensor(0.0010, grad_fn=<MseLossBackward0>) tensor([ 0.0380, -0.0530]) tensor([-1.9833,  1.9744], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
68 tensor(0.0006, grad_fn=<MseLossBackward0>) tensor([ 0.0216, -0.0354]) tensor([-1.9837,  1.9750], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
68 tensor(0.0006

87 tensor(5.1553e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0057, -0.0103]) tensor([-1.9957,  1.9930], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
87 tensor(4.3020e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0072, -0.0079]) tensor([-1.9958,  1.9931], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
88 tensor(6.1654e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0070, -0.0133]) tensor([-1.9958,  1.9932], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
88 tensor(6.6669e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0091, -0.0139]) tensor([-1.9959,  1.9933], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
88 tensor(4.5431e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0053, -0.0096]) tensor([-1.9960,  1.9934], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([50, 1])
88 tensor(3.7590e-05, grad_fn=<MseLossBackward0>) tensor([ 0.0067, -0.0074]) tensor([-1.9960,  1.9935], grad_fn=<CatBackward0>)
torch.Size([50, 1])
torch.Size([

In [11]:
parameters_to_vector(model.parameters())

tensor([-1.9982,  1.9969], grad_fn=<CatBackward0>)

In [12]:
class CNN_Net(nn.Module):
    def __init__(self):
        super(CNN_Net, self).__init__()
        self.conv1 = nn.Conv2d(1, 32, kernel_size=5)
        self.conv2 = nn.Conv2d(32, 64, kernel_size=5)
        self.pool = nn.MaxPool2d(2,2)
        self.dropout = nn.Dropout(p=0.2)
        self.fc1 = nn.Linear(1024, 512)
        self.fc2 = nn.Linear(512, 10)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = self.dropout(x)
        x = torch.flatten(x, 1)
        x = F.relu(self.fc1(x))
        output = self.fc2(x)
        return output

In [13]:
class ClientUpdate(object):
    def __init__(self, dataset, batchSize, alpha, lamda, epochs, projection_list, projected_weights):
        self.train_loader = DataLoader(MyDataset(dataset["features"], dataset["label"]), batch_size=batchSize, shuffle=True)
        #self.learning_rate = learning_rate
        self.epochs = epochs
        self.batchSize = batchSize

    def train(self, model):
        criterion = nn.MSELoss()
        optimizer = torch.optim.SGD(model.parameters(), lr=1e-3, momentum=0.5)

        e_loss = []
        for epoch in range(1, self.epochs+1):
            train_loss = 0
            model.train()
            for i, (data, labels) in zip(range(1), self.train_loader):
                data, labels = data, labels
                optimizer.zero_grad() 
                output = model(data)  
                loss = criterion(output, labels)
                #loss += mu/2 * torch.norm(client_param.data - server_param.data)**2
                loss.backward()
                grads = grads_to_vector(model.parameters())
                #optimizer.step()
                train_loss += loss.item()*data.size(0)
                weights = parameters_to_vector(model.parameters())
                mat_vec_sum = torch.zeros_like(weights)
                for j in G.neighbors(model.user_id):
                    mat_vec_sum = torch.add(mat_vec_sum, torch.matmul(torch.transpose(projection_list[model.user_id][j], 0, 1), 
                                                         projected_weights[j][model.user_id] - projected_weights[model.user_id][j]))
                
                model_update = parameters_to_vector(model.parameters()) - alpha * (grads + lamda * mat_vec_sum)
                
            vector_to_parameters(parameters=model.parameters(), vec=model_update)
                

            train_loss = train_loss/self.batchSize#len(self.train_loader.dataset) 
            e_loss.append(train_loss)

        total_loss = e_loss#sum(e_loss)/len(e_loss)

        return model.state_dict(), total_loss

In [14]:
# Preparing projection matrices
models = [MLP_Net(user_id=i) for i in range(no_users)]
#temp = MLP_Net()
projection_list = []
projected_weights = []

def update_ProjWeight(projection_list, projected_weights, first_run=True):
    #projected_weights = []
    for i in range(no_users):
        neighbors_mat = []
        neighbors_weights = []
        for j in range(no_users):
            if j in G.neighbors(i):
                with torch.no_grad():
                    if first_run == True:
                        row, column = parameters_to_vector(models[j].parameters()).size()[0], parameters_to_vector(models[i].parameters()).size()[0]
                        mat = torch.zeros((row, column))
                        mat.fill_diagonal_(1.0 + 1.0 * float(np.random.randn(1)))
                        neighbors_mat.append(mat)
                        neighbors_weights.append(torch.matmul(mat, parameters_to_vector(models[j].parameters())))
                    else:
                        neighbors_weights.append(torch.matmul(projection_list[j][i], parameters_to_vector(models[j].parameters())))
            else:
                neighbors_mat.append(0)
                neighbors_weights.append(0)
        if first_run == True:
            projection_list.append(neighbors_mat)
        projected_weights.append(neighbors_weights)

update_ProjWeight(projection_list, projected_weights)



In [15]:
print(projection_list[0])

[0, tensor([[1.6434, 0.0000],
        [0.0000, 1.6434]]), tensor([[-0.6775,  0.0000],
        [ 0.0000, -0.6775]]), tensor([[0.2411, 0.0000],
        [0.0000, 0.2411]]), tensor([[1.8230, 0.0000],
        [0.0000, 1.8230]]), tensor([[1.3884, 0.0000],
        [0.0000, 1.3884]]), tensor([[1.7704, 0.0000],
        [0.0000, 1.7704]]), 0, tensor([[-0.1809,  0.0000],
        [ 0.0000, -0.1809]]), tensor([[0.6027, 0.0000],
        [0.0000, 0.6027]]), 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]


In [16]:
def testing(model, dataset, bs, criterion): 
    test_loss = 0
    correct = 0
    test_loader = DataLoader(MyDataset(dataset["features"], dataset["label"]), batch_size=bs)
    l = len(test_loader)
    model.eval()
    for data, labels in test_loader:
        data, labels = data, labels
        output = model(data)
        loss = criterion(output, labels)
        test_loss += loss.item()*data.size(0)
        #_, pred = torch.max(output, 1)
        #correct += pred.eq(labels.data.view_as(pred)).sum().item()
    
    test_loss /= len(test_loader.dataset)
    
    return test_loss

In [17]:
def rel_error(model):
    return (torch.norm(parameters_to_vector(model.parameters()) - datapoints[model.user_id]['exact_weights']) / torch.norm(datapoints[model.user_id]['exact_weights'])).detach()

In [18]:
torch.norm(datapoints[model.user_id]['exact_weights'])

tensor(2.8284, dtype=torch.float64)

In [19]:
model = MLP_Net(user_id=0)

from torch.nn.utils import parameters_to_vector, vector_to_parameters

with torch.no_grad():    
    params = parameters_to_vector(model.parameters())

    print(params)

params *= 2.

vector_to_parameters(parameters=model.parameters(), vec=params)

parameters_to_vector(model.parameters())





tensor([-0.4948,  0.1582])


tensor([-0.9895,  0.3165], grad_fn=<CatBackward0>)

In [20]:
#global_model = CNN_Net().cuda()
models = [MLP_Net(user_id=i) for i in range(no_users)]
dummy_models = [MLP_Net(user_id=i) for i in range(no_users)]

#model.load_state_dict(global_model.state_dict())

criterion = nn.MSELoss()


train_loss = []
test_loss = []
test_accuracy = []
total_rel_error = []

for curr_round in tqdm(range(1, it+1)):
    w, local_loss = [], []

    
    for i in range(no_users):
        dummy_models[i].load_state_dict(models[i].state_dict())
        local_update = ClientUpdate(dataset=datapoints[i], batchSize=batch_size, alpha=alpha, lamda=lamda, epochs=1, projection_list=projection_list, projected_weights=projected_weights)
        weights, loss = local_update.train(dummy_models[i])
        w.append(weights)
        local_loss.append(loss)
        models[i].load_state_dict(w[i])
        
    
    
    # Update prjection matrix
    
    #print(projection_list[0], projected_weights[0])
    
    for i in range(no_users):
        weights = parameters_to_vector(models[i].parameters())
        for j in G.neighbors(i):
            mat_vec_sum = torch.zeros_like(weights)
            for k in G.neighbors(i):
                mat_vec_sum = torch.add(mat_vec_sum, projected_weights[k][i] - projected_weights[i][k])
            #print(torch.outer(mat_vec_sum, weights))

            projection_list[i][j] = torch.add(projection_list[i][j], -1 * eta * lamda * mat_vec_sum)
                                         
    projected_weights = []                                          
    update_ProjWeight(projection_list, projected_weights, first_run=False)
        
        
        
    
    




          
            

    local_test_acc = []
    local_test_loss = []
    user_rel_error = 0
    for k in range(no_users):
      
        g_loss = testing(models[i], datapoints[i], 50, criterion)
        local_test_loss.append(g_loss)
        user_rel_error += rel_error(models[i])
    
    
        

    g_loss = sum(local_test_loss) / len(local_test_loss)
    total_rel_error.append(user_rel_error / no_users)
    
    

    test_loss.append(g_loss)
    #test_accuracy.append(g_accuracy)
    print("Training_loss %2.5f,   Relative Error %2.5f"% (test_loss[-1], total_rel_error[-1]))

  0%|          | 1/2000 [00:00<03:29,  9.55it/s]

Training_loss 8.87526,   Relative Error 1.14112


  0%|          | 3/2000 [00:00<02:52, 11.55it/s]

Training_loss 8.84790,   Relative Error 1.13935
Training_loss 8.80522,   Relative Error 1.13668
Training_loss 8.78304,   Relative Error 1.13521


  0%|          | 5/2000 [00:00<02:54, 11.40it/s]

Training_loss 8.75723,   Relative Error 1.13353
Training_loss 8.73376,   Relative Error 1.13198


  0%|          | 7/2000 [00:00<02:54, 11.44it/s]

Training_loss 8.69203,   Relative Error 1.12930


  0%|          | 9/2000 [00:00<02:51, 11.59it/s]

Training_loss 8.66784,   Relative Error 1.12774
Training_loss 8.65956,   Relative Error 1.12721
Training_loss 8.64057,   Relative Error 1.12598


  1%|          | 11/2000 [00:00<02:51, 11.58it/s]

Training_loss 8.60336,   Relative Error 1.12361
Training_loss 8.58259,   Relative Error 1.12226


  1%|          | 13/2000 [00:01<02:48, 11.82it/s]

Training_loss 8.54953,   Relative Error 1.12011


  1%|          | 15/2000 [00:01<02:52, 11.53it/s]

Training_loss 8.52173,   Relative Error 1.11830
Training_loss 8.47444,   Relative Error 1.11517
Training_loss 8.44324,   Relative Error 1.11313


  1%|          | 17/2000 [00:01<02:52, 11.50it/s]

Training_loss 8.41328,   Relative Error 1.11115
Training_loss 8.39091,   Relative Error 1.10966


  1%|          | 19/2000 [00:01<02:59, 11.04it/s]

Training_loss 8.37538,   Relative Error 1.10869
Training_loss 8.35130,   Relative Error 1.10711


  1%|          | 21/2000 [00:01<03:09, 10.43it/s]

Training_loss 8.32885,   Relative Error 1.10561
Training_loss 8.30229,   Relative Error 1.10387


  1%|          | 23/2000 [00:02<03:06, 10.58it/s]

Training_loss 8.27994,   Relative Error 1.10237


  1%|▏         | 25/2000 [00:02<02:58, 11.06it/s]

Training_loss 8.25134,   Relative Error 1.10045
Training_loss 8.23782,   Relative Error 1.09953
Training_loss 8.21364,   Relative Error 1.09794


  1%|▏         | 27/2000 [00:02<02:58, 11.05it/s]

Training_loss 8.19676,   Relative Error 1.09681
Training_loss 8.16802,   Relative Error 1.09485


  1%|▏         | 29/2000 [00:02<02:55, 11.24it/s]

Training_loss 8.15565,   Relative Error 1.09401


  2%|▏         | 31/2000 [00:02<02:56, 11.18it/s]

Training_loss 8.10694,   Relative Error 1.09070
Training_loss 8.07629,   Relative Error 1.08865
Training_loss 8.04075,   Relative Error 1.08629


  2%|▏         | 33/2000 [00:02<02:57, 11.07it/s]

Training_loss 8.02058,   Relative Error 1.08493
Training_loss 7.99006,   Relative Error 1.08281


  2%|▏         | 36/2000 [00:03<04:59,  6.55it/s]

Training_loss 7.94249,   Relative Error 1.07957
Training_loss 7.91786,   Relative Error 1.07791


  2%|▏         | 38/2000 [00:03<04:43,  6.93it/s]

Training_loss 7.89342,   Relative Error 1.07620
Training_loss 7.87190,   Relative Error 1.07471


  2%|▏         | 41/2000 [00:04<03:55,  8.30it/s]

Training_loss 7.84299,   Relative Error 1.07280
Training_loss 7.80436,   Relative Error 1.07018
Training_loss 7.77748,   Relative Error 1.06840


  2%|▏         | 43/2000 [00:04<03:21,  9.73it/s]

Training_loss 7.75856,   Relative Error 1.06709
Training_loss 7.74307,   Relative Error 1.06600
Training_loss 7.72230,   Relative Error 1.06456


  2%|▏         | 47/2000 [00:04<02:52, 11.34it/s]

Training_loss 7.70628,   Relative Error 1.06345
Training_loss 7.67454,   Relative Error 1.06127
Training_loss 7.65664,   Relative Error 1.06005


  2%|▏         | 49/2000 [00:04<02:43, 11.97it/s]

Training_loss 7.63680,   Relative Error 1.05866
Training_loss 7.60779,   Relative Error 1.05664
Training_loss 7.56876,   Relative Error 1.05387


  3%|▎         | 53/2000 [00:05<02:35, 12.49it/s]

Training_loss 7.55453,   Relative Error 1.05286
Training_loss 7.53202,   Relative Error 1.05133
Training_loss 7.50612,   Relative Error 1.04953


  3%|▎         | 55/2000 [00:05<02:34, 12.59it/s]

Training_loss 7.48118,   Relative Error 1.04778
Training_loss 7.46739,   Relative Error 1.04684
Training_loss 7.44034,   Relative Error 1.04498


  3%|▎         | 59/2000 [00:05<02:37, 12.35it/s]

Training_loss 7.41367,   Relative Error 1.04313
Training_loss 7.39470,   Relative Error 1.04182
Training_loss 7.35006,   Relative Error 1.03858


  3%|▎         | 61/2000 [00:05<02:51, 11.33it/s]

Training_loss 7.32808,   Relative Error 1.03703
Training_loss 7.30978,   Relative Error 1.03575


  3%|▎         | 63/2000 [00:06<03:05, 10.46it/s]

Training_loss 7.27630,   Relative Error 1.03336
Training_loss 7.25516,   Relative Error 1.03188
Training_loss 7.21488,   Relative Error 1.02908


  3%|▎         | 67/2000 [00:06<02:50, 11.32it/s]

Training_loss 7.18814,   Relative Error 1.02725
Training_loss 7.17767,   Relative Error 1.02649
Training_loss 7.16577,   Relative Error 1.02564


  3%|▎         | 69/2000 [00:06<02:41, 11.94it/s]

Training_loss 7.13498,   Relative Error 1.02347
Training_loss 7.11491,   Relative Error 1.02206
Training_loss 7.09102,   Relative Error 1.02036


  4%|▎         | 73/2000 [00:07<03:01, 10.63it/s]

Training_loss 7.06211,   Relative Error 1.01831
Training_loss 7.04013,   Relative Error 1.01675
Training_loss 7.00785,   Relative Error 1.01441


  4%|▍         | 75/2000 [00:07<03:00, 10.65it/s]

Training_loss 6.98230,   Relative Error 1.01257
Training_loss 6.95835,   Relative Error 1.01084
Training_loss 6.92355,   Relative Error 1.00833


  4%|▍         | 79/2000 [00:07<02:55, 10.93it/s]

Training_loss 6.88774,   Relative Error 1.00576
Training_loss 6.84080,   Relative Error 1.00229
Training_loss 6.80922,   Relative Error 1.00000


  4%|▍         | 81/2000 [00:07<02:49, 11.32it/s]

Training_loss 6.79340,   Relative Error 0.99885
Training_loss 6.76408,   Relative Error 0.99670
Training_loss 6.72994,   Relative Error 0.99412


  4%|▍         | 85/2000 [00:08<02:45, 11.60it/s]

Training_loss 6.70627,   Relative Error 0.99235
Training_loss 6.68220,   Relative Error 0.99054
Training_loss 6.65851,   Relative Error 0.98876


  4%|▍         | 87/2000 [00:08<02:41, 11.81it/s]

Training_loss 6.64313,   Relative Error 0.98759
Training_loss 6.62330,   Relative Error 0.98612


  4%|▍         | 89/2000 [00:08<03:00, 10.61it/s]

Training_loss 6.59555,   Relative Error 0.98411
Training_loss 6.56866,   Relative Error 0.98207
Training_loss 6.54780,   Relative Error 0.98050


  5%|▍         | 93/2000 [00:08<03:00, 10.57it/s]

Training_loss 6.53029,   Relative Error 0.97918
Training_loss 6.51302,   Relative Error 0.97790
Training_loss 6.48843,   Relative Error 0.97604


  5%|▍         | 95/2000 [00:08<02:58, 10.69it/s]

Training_loss 6.46972,   Relative Error 0.97462
Training_loss 6.43198,   Relative Error 0.97184
Training_loss 6.41116,   Relative Error 0.97026


  5%|▍         | 99/2000 [00:09<02:53, 10.98it/s]

Training_loss 6.39440,   Relative Error 0.96901
Training_loss 6.38009,   Relative Error 0.96796
Training_loss 6.34505,   Relative Error 0.96527


  5%|▌         | 101/2000 [00:09<02:48, 11.27it/s]

Training_loss 6.31486,   Relative Error 0.96300
Training_loss 6.30247,   Relative Error 0.96205
Training_loss 6.27256,   Relative Error 0.95972


  5%|▌         | 105/2000 [00:09<02:42, 11.67it/s]

Training_loss 6.24771,   Relative Error 0.95781
Training_loss 6.21479,   Relative Error 0.95534
Training_loss 6.18422,   Relative Error 0.95297


  5%|▌         | 107/2000 [00:10<03:04, 10.24it/s]

Training_loss 6.16731,   Relative Error 0.95163
Training_loss 6.14816,   Relative Error 0.95016
Training_loss 6.12874,   Relative Error 0.94866


  5%|▌         | 109/2000 [00:10<03:05, 10.20it/s]

Training_loss 6.10713,   Relative Error 0.94701
Training_loss 6.08323,   Relative Error 0.94516


  6%|▌         | 113/2000 [00:10<03:04, 10.25it/s]

Training_loss 6.05429,   Relative Error 0.94287
Training_loss 6.04058,   Relative Error 0.94181
Training_loss 6.02367,   Relative Error 0.94047


  6%|▌         | 115/2000 [00:10<02:58, 10.56it/s]

Training_loss 6.00244,   Relative Error 0.93879
Training_loss 5.98058,   Relative Error 0.93711
Training_loss 5.96181,   Relative Error 0.93558


  6%|▌         | 119/2000 [00:11<02:44, 11.46it/s]

Training_loss 5.93589,   Relative Error 0.93352
Training_loss 5.92324,   Relative Error 0.93252
Training_loss 5.90364,   Relative Error 0.93095


  6%|▌         | 121/2000 [00:11<02:45, 11.34it/s]

Training_loss 5.87999,   Relative Error 0.92909
Training_loss 5.86722,   Relative Error 0.92809
Training_loss 5.84960,   Relative Error 0.92671


  6%|▋         | 125/2000 [00:11<02:48, 11.13it/s]

Training_loss 5.82908,   Relative Error 0.92508
Training_loss 5.81701,   Relative Error 0.92410
Training_loss 5.79581,   Relative Error 0.92241


  6%|▋         | 127/2000 [00:11<02:40, 11.64it/s]

Training_loss 5.76154,   Relative Error 0.91969
Training_loss 5.73958,   Relative Error 0.91792
Training_loss 5.71059,   Relative Error 0.91559


  7%|▋         | 131/2000 [00:12<02:53, 10.80it/s]

Training_loss 5.69378,   Relative Error 0.91425
Training_loss 5.68022,   Relative Error 0.91316
Training_loss 5.65640,   Relative Error 0.91130


  7%|▋         | 133/2000 [00:12<02:46, 11.19it/s]

Training_loss 5.63848,   Relative Error 0.90983
Training_loss 5.62530,   Relative Error 0.90873
Training_loss 5.60766,   Relative Error 0.90731


  7%|▋         | 137/2000 [00:12<02:53, 10.76it/s]

Training_loss 5.59275,   Relative Error 0.90612
Training_loss 5.57315,   Relative Error 0.90457
Training_loss 5.55189,   Relative Error 0.90278


  7%|▋         | 139/2000 [00:13<02:47, 11.13it/s]

Training_loss 5.53816,   Relative Error 0.90167
Training_loss 5.52701,   Relative Error 0.90075
Training_loss 5.50561,   Relative Error 0.89899


  7%|▋         | 143/2000 [00:13<02:45, 11.25it/s]

Training_loss 5.49389,   Relative Error 0.89804
Training_loss 5.47669,   Relative Error 0.89662
Training_loss 5.46425,   Relative Error 0.89562


  7%|▋         | 145/2000 [00:13<02:44, 11.26it/s]

Training_loss 5.44863,   Relative Error 0.89435
Training_loss 5.44073,   Relative Error 0.89370
Training_loss 5.41928,   Relative Error 0.89194


  7%|▋         | 149/2000 [00:13<02:52, 10.75it/s]

Training_loss 5.39356,   Relative Error 0.88982
Training_loss 5.37767,   Relative Error 0.88853
Training_loss 5.35947,   Relative Error 0.88700


  8%|▊         | 151/2000 [00:14<02:53, 10.69it/s]

Training_loss 5.34632,   Relative Error 0.88595
Training_loss 5.32487,   Relative Error 0.88415


  8%|▊         | 153/2000 [00:14<02:59, 10.31it/s]

Training_loss 5.30495,   Relative Error 0.88253
Training_loss 5.28630,   Relative Error 0.88097
Training_loss 5.24926,   Relative Error 0.87785


  8%|▊         | 157/2000 [00:14<03:00, 10.19it/s]

Training_loss 5.23189,   Relative Error 0.87641
Training_loss 5.21380,   Relative Error 0.87493
Training_loss 5.19074,   Relative Error 0.87302


  8%|▊         | 159/2000 [00:14<03:03, 10.04it/s]

Training_loss 5.18012,   Relative Error 0.87214
Training_loss 5.16437,   Relative Error 0.87084


  8%|▊         | 161/2000 [00:15<03:09,  9.69it/s]

Training_loss 5.14495,   Relative Error 0.86922
Training_loss 5.13115,   Relative Error 0.86807


  8%|▊         | 164/2000 [00:15<03:04,  9.94it/s]

Training_loss 5.11000,   Relative Error 0.86621
Training_loss 5.09513,   Relative Error 0.86492
Training_loss 5.07904,   Relative Error 0.86356


  8%|▊         | 166/2000 [00:15<03:01, 10.09it/s]

Training_loss 5.05521,   Relative Error 0.86153
Training_loss 5.03946,   Relative Error 0.86017
Training_loss 5.02315,   Relative Error 0.85881


  8%|▊         | 169/2000 [00:15<03:11,  9.56it/s]

Training_loss 5.00418,   Relative Error 0.85718
Training_loss 4.99583,   Relative Error 0.85644


  9%|▊         | 171/2000 [00:16<03:08,  9.70it/s]

Training_loss 4.97548,   Relative Error 0.85471
Training_loss 4.96172,   Relative Error 0.85349
Training_loss 4.93957,   Relative Error 0.85158


  9%|▉         | 175/2000 [00:16<02:50, 10.68it/s]

Training_loss 4.92141,   Relative Error 0.85003
Training_loss 4.90361,   Relative Error 0.84853
Training_loss 4.88463,   Relative Error 0.84689


  9%|▉         | 177/2000 [00:16<02:50, 10.71it/s]

Training_loss 4.86548,   Relative Error 0.84523
Training_loss 4.84252,   Relative Error 0.84322
Training_loss 4.82971,   Relative Error 0.84213


  9%|▉         | 181/2000 [00:17<02:55, 10.39it/s]

Training_loss 4.80523,   Relative Error 0.83995
Training_loss 4.79328,   Relative Error 0.83894
Training_loss 4.78331,   Relative Error 0.83806


  9%|▉         | 183/2000 [00:17<02:49, 10.74it/s]

Training_loss 4.76633,   Relative Error 0.83659
Training_loss 4.73950,   Relative Error 0.83424
Training_loss 4.71967,   Relative Error 0.83249


  9%|▉         | 187/2000 [00:17<02:40, 11.31it/s]

Training_loss 4.70650,   Relative Error 0.83132
Training_loss 4.68950,   Relative Error 0.82983
Training_loss 4.66932,   Relative Error 0.82808


  9%|▉         | 189/2000 [00:17<02:42, 11.16it/s]

Training_loss 4.66084,   Relative Error 0.82735
Training_loss 4.63940,   Relative Error 0.82544


 10%|▉         | 191/2000 [00:18<02:51, 10.54it/s]

Training_loss 4.62068,   Relative Error 0.82380
Training_loss 4.60796,   Relative Error 0.82268
Training_loss 4.58916,   Relative Error 0.82102


 10%|▉         | 195/2000 [00:18<02:49, 10.64it/s]

Training_loss 4.58407,   Relative Error 0.82056
Training_loss 4.56926,   Relative Error 0.81923
Training_loss 4.56021,   Relative Error 0.81840


 10%|▉         | 197/2000 [00:18<02:47, 10.77it/s]

Training_loss 4.54659,   Relative Error 0.81717
Training_loss 4.53282,   Relative Error 0.81594
Training_loss 4.51296,   Relative Error 0.81412


 10%|█         | 201/2000 [00:18<02:49, 10.62it/s]

Training_loss 4.50030,   Relative Error 0.81295
Training_loss 4.48220,   Relative Error 0.81129
Training_loss 4.45995,   Relative Error 0.80923


 10%|█         | 203/2000 [00:19<02:52, 10.39it/s]

Training_loss 4.44271,   Relative Error 0.80766
Training_loss 4.42442,   Relative Error 0.80602
Training_loss 4.41594,   Relative Error 0.80521


 10%|█         | 207/2000 [00:19<02:38, 11.30it/s]

Training_loss 4.39494,   Relative Error 0.80329
Training_loss 4.37720,   Relative Error 0.80170
Training_loss 4.37034,   Relative Error 0.80107


 10%|█         | 209/2000 [00:19<02:33, 11.64it/s]

Training_loss 4.35555,   Relative Error 0.79973
Training_loss 4.33596,   Relative Error 0.79789
Training_loss 4.32863,   Relative Error 0.79723


 11%|█         | 213/2000 [00:19<02:35, 11.48it/s]

Training_loss 4.32320,   Relative Error 0.79677
Training_loss 4.31232,   Relative Error 0.79578
Training_loss 4.29302,   Relative Error 0.79397


 11%|█         | 215/2000 [00:20<02:42, 11.00it/s]

Training_loss 4.28190,   Relative Error 0.79298
Training_loss 4.27468,   Relative Error 0.79232
Training_loss 4.25765,   Relative Error 0.79074


 11%|█         | 219/2000 [00:20<02:39, 11.19it/s]

Training_loss 4.24488,   Relative Error 0.78954
Training_loss 4.23567,   Relative Error 0.78869
Training_loss 4.22755,   Relative Error 0.78793


 11%|█         | 221/2000 [00:20<03:47,  7.81it/s]

Training_loss 4.21324,   Relative Error 0.78657
Training_loss 4.20310,   Relative Error 0.78559


 11%|█         | 224/2000 [00:21<03:28,  8.52it/s]

Training_loss 4.18883,   Relative Error 0.78426
Training_loss 4.17905,   Relative Error 0.78337
Training_loss 4.16518,   Relative Error 0.78201


 11%|█▏        | 227/2000 [00:21<02:57,  9.98it/s]

Training_loss 4.15621,   Relative Error 0.78117
Training_loss 4.13482,   Relative Error 0.77917
Training_loss 4.12039,   Relative Error 0.77780


 11%|█▏        | 229/2000 [00:21<02:44, 10.76it/s]

Training_loss 4.11303,   Relative Error 0.77712
Training_loss 4.09977,   Relative Error 0.77588
Training_loss 4.08463,   Relative Error 0.77444


 12%|█▏        | 233/2000 [00:22<02:31, 11.63it/s]

Training_loss 4.07081,   Relative Error 0.77315
Training_loss 4.06505,   Relative Error 0.77260
Training_loss 4.05496,   Relative Error 0.77167


 12%|█▏        | 235/2000 [00:22<02:36, 11.31it/s]

Training_loss 4.04852,   Relative Error 0.77104
Training_loss 4.02926,   Relative Error 0.76924
Training_loss 4.02080,   Relative Error 0.76844


 12%|█▏        | 239/2000 [00:22<02:42, 10.85it/s]

Training_loss 4.01250,   Relative Error 0.76768
Training_loss 4.00702,   Relative Error 0.76715
Training_loss 3.99492,   Relative Error 0.76598


 12%|█▏        | 241/2000 [00:22<02:54, 10.09it/s]

Training_loss 3.98740,   Relative Error 0.76523
Training_loss 3.97588,   Relative Error 0.76411


 12%|█▏        | 243/2000 [00:23<03:13,  9.06it/s]

Training_loss 3.96000,   Relative Error 0.76259
Training_loss 3.94934,   Relative Error 0.76156


 12%|█▏        | 246/2000 [00:23<03:03,  9.54it/s]

Training_loss 3.93040,   Relative Error 0.75973
Training_loss 3.91815,   Relative Error 0.75853
Training_loss 3.91269,   Relative Error 0.75799


 12%|█▏        | 249/2000 [00:23<02:45, 10.61it/s]

Training_loss 3.90179,   Relative Error 0.75694
Training_loss 3.89093,   Relative Error 0.75589
Training_loss 3.87713,   Relative Error 0.75456


 13%|█▎        | 251/2000 [00:23<02:43, 10.72it/s]

Training_loss 3.86128,   Relative Error 0.75305
Training_loss 3.85073,   Relative Error 0.75202
Training_loss 3.84373,   Relative Error 0.75134


 13%|█▎        | 253/2000 [00:23<02:37, 11.11it/s]

Training_loss 3.82869,   Relative Error 0.74982
Training_loss 3.81075,   Relative Error 0.74805


 13%|█▎        | 256/2000 [00:24<03:26,  8.44it/s]

Training_loss 3.79646,   Relative Error 0.74663
Training_loss 3.78762,   Relative Error 0.74573
Training_loss 3.77969,   Relative Error 0.74496


 13%|█▎        | 260/2000 [00:24<03:03,  9.50it/s]

Training_loss 3.77015,   Relative Error 0.74399
Training_loss 3.76204,   Relative Error 0.74319
Training_loss 3.75649,   Relative Error 0.74264


 13%|█▎        | 262/2000 [00:25<02:48, 10.31it/s]

Training_loss 3.74755,   Relative Error 0.74175
Training_loss 3.73851,   Relative Error 0.74085
Training_loss 3.73434,   Relative Error 0.74044


 13%|█▎        | 266/2000 [00:25<02:32, 11.35it/s]

Training_loss 3.72708,   Relative Error 0.73971
Training_loss 3.71424,   Relative Error 0.73845
Training_loss 3.70607,   Relative Error 0.73762


 13%|█▎        | 268/2000 [00:25<02:32, 11.33it/s]

Training_loss 3.68737,   Relative Error 0.73575
Training_loss 3.67298,   Relative Error 0.73434
Training_loss 3.65019,   Relative Error 0.73203


 14%|█▎        | 270/2000 [00:25<02:32, 11.33it/s]

Training_loss 3.63502,   Relative Error 0.73048
Training_loss 3.62739,   Relative Error 0.72967


 14%|█▎        | 272/2000 [00:25<02:44, 10.52it/s]

Training_loss 3.61157,   Relative Error 0.72809
Training_loss 3.60085,   Relative Error 0.72698


 14%|█▍        | 276/2000 [00:26<02:48, 10.25it/s]

Training_loss 3.59107,   Relative Error 0.72597
Training_loss 3.58188,   Relative Error 0.72502
Training_loss 3.56867,   Relative Error 0.72369


 14%|█▍        | 278/2000 [00:26<02:52,  9.97it/s]

Training_loss 3.55693,   Relative Error 0.72252
Training_loss 3.54643,   Relative Error 0.72143
Training_loss 3.53257,   Relative Error 0.72001


 14%|█▍        | 282/2000 [00:26<02:43, 10.54it/s]

Training_loss 3.52504,   Relative Error 0.71926
Training_loss 3.51057,   Relative Error 0.71776
Training_loss 3.50515,   Relative Error 0.71719


 14%|█▍        | 284/2000 [00:27<02:38, 10.81it/s]

Training_loss 3.49531,   Relative Error 0.71618
Training_loss 3.48098,   Relative Error 0.71474
Training_loss 3.46782,   Relative Error 0.71340


 14%|█▍        | 288/2000 [00:27<02:37, 10.90it/s]

Training_loss 3.46131,   Relative Error 0.71272
Training_loss 3.45146,   Relative Error 0.71173
Training_loss 3.44369,   Relative Error 0.71094


 14%|█▍        | 290/2000 [00:27<02:45, 10.35it/s]

Training_loss 3.43377,   Relative Error 0.70994
Training_loss 3.42432,   Relative Error 0.70895


 15%|█▍        | 292/2000 [00:27<02:46, 10.27it/s]

Training_loss 3.41230,   Relative Error 0.70771
Training_loss 3.40570,   Relative Error 0.70702


 15%|█▍        | 294/2000 [00:28<02:44, 10.37it/s]

Training_loss 3.39150,   Relative Error 0.70556
Training_loss 3.38212,   Relative Error 0.70456
Training_loss 3.36982,   Relative Error 0.70326


 15%|█▍        | 298/2000 [00:28<02:30, 11.31it/s]

Training_loss 3.36108,   Relative Error 0.70238
Training_loss 3.35240,   Relative Error 0.70152
Training_loss 3.34505,   Relative Error 0.70071


 15%|█▌        | 300/2000 [00:28<02:42, 10.48it/s]

Training_loss 3.34088,   Relative Error 0.70029
Training_loss 3.33636,   Relative Error 0.69981


 15%|█▌        | 302/2000 [00:28<02:43, 10.38it/s]

Training_loss 3.32882,   Relative Error 0.69900
Training_loss 3.32495,   Relative Error 0.69861
Training_loss 3.31952,   Relative Error 0.69803


 15%|█▌        | 306/2000 [00:29<02:32, 11.13it/s]

Training_loss 3.31452,   Relative Error 0.69751
Training_loss 3.29192,   Relative Error 0.69508
Training_loss 3.28512,   Relative Error 0.69436


 15%|█▌        | 308/2000 [00:29<02:59,  9.41it/s]

Training_loss 3.27666,   Relative Error 0.69348
Training_loss 3.27218,   Relative Error 0.69299


 15%|█▌        | 309/2000 [00:29<04:11,  6.72it/s]

Training_loss 3.26174,   Relative Error 0.69189


 16%|█▌        | 310/2000 [00:29<04:38,  6.07it/s]

Training_loss 3.25306,   Relative Error 0.69096


 16%|█▌        | 312/2000 [00:30<05:18,  5.31it/s]

Training_loss 3.24685,   Relative Error 0.69034
Training_loss 3.23893,   Relative Error 0.68951


 16%|█▌        | 314/2000 [00:30<04:55,  5.70it/s]

Training_loss 3.22021,   Relative Error 0.68750
Training_loss 3.21228,   Relative Error 0.68667


 16%|█▌        | 317/2000 [00:30<03:17,  8.51it/s]

Training_loss 3.20532,   Relative Error 0.68592
Training_loss 3.19277,   Relative Error 0.68461
Training_loss 3.18890,   Relative Error 0.68420


 16%|█▌        | 319/2000 [00:31<03:38,  7.68it/s]

Training_loss 3.18179,   Relative Error 0.68344
Training_loss 3.17977,   Relative Error 0.68323


 16%|█▌        | 321/2000 [00:31<03:56,  7.09it/s]

Training_loss 3.17452,   Relative Error 0.68266
Training_loss 3.16269,   Relative Error 0.68139


 16%|█▌        | 323/2000 [00:31<03:41,  7.56it/s]

Training_loss 3.14756,   Relative Error 0.67976
Training_loss 3.14262,   Relative Error 0.67921


 16%|█▋        | 326/2000 [00:32<03:04,  9.07it/s]

Training_loss 3.13232,   Relative Error 0.67811
Training_loss 3.12537,   Relative Error 0.67735
Training_loss 3.12104,   Relative Error 0.67688


 16%|█▋        | 328/2000 [00:32<02:53,  9.62it/s]

Training_loss 3.11370,   Relative Error 0.67608
Training_loss 3.10310,   Relative Error 0.67492
Training_loss 3.09298,   Relative Error 0.67379


 16%|█▋        | 330/2000 [00:32<02:47,  9.96it/s]

Training_loss 3.07993,   Relative Error 0.67236
Training_loss 3.06868,   Relative Error 0.67113


 17%|█▋        | 333/2000 [00:32<02:51,  9.74it/s]

Training_loss 3.05645,   Relative Error 0.66979
Training_loss 3.04939,   Relative Error 0.66904


 17%|█▋        | 335/2000 [00:33<03:04,  9.03it/s]

Training_loss 3.04011,   Relative Error 0.66801
Training_loss 3.03350,   Relative Error 0.66728


 17%|█▋        | 337/2000 [00:33<02:53,  9.57it/s]

Training_loss 3.02552,   Relative Error 0.66642
Training_loss 3.01726,   Relative Error 0.66550
Training_loss 3.01223,   Relative Error 0.66495


 17%|█▋        | 341/2000 [00:33<02:32, 10.90it/s]

Training_loss 3.00262,   Relative Error 0.66386
Training_loss 2.99338,   Relative Error 0.66289
Training_loss 2.98926,   Relative Error 0.66244


 17%|█▋        | 343/2000 [00:33<02:27, 11.22it/s]

Training_loss 2.98654,   Relative Error 0.66214
Training_loss 2.98199,   Relative Error 0.66161
Training_loss 2.97336,   Relative Error 0.66064


 17%|█▋        | 347/2000 [00:34<02:21, 11.67it/s]

Training_loss 2.96750,   Relative Error 0.65998
Training_loss 2.96261,   Relative Error 0.65942
Training_loss 2.95134,   Relative Error 0.65817


 17%|█▋        | 349/2000 [00:34<02:19, 11.83it/s]

Training_loss 2.94080,   Relative Error 0.65701
Training_loss 2.92728,   Relative Error 0.65550


 18%|█▊        | 351/2000 [00:34<02:32, 10.81it/s]

Training_loss 2.92306,   Relative Error 0.65503
Training_loss 2.91178,   Relative Error 0.65380
Training_loss 2.90258,   Relative Error 0.65276


 18%|█▊        | 354/2000 [00:35<03:37,  7.58it/s]

Training_loss 2.89463,   Relative Error 0.65186
Training_loss 2.88805,   Relative Error 0.65114


 18%|█▊        | 356/2000 [00:35<04:37,  5.93it/s]

Training_loss 2.87894,   Relative Error 0.65008
Training_loss 2.87284,   Relative Error 0.64937


 18%|█▊        | 358/2000 [00:35<04:19,  6.32it/s]

Training_loss 2.86786,   Relative Error 0.64880
Training_loss 2.85655,   Relative Error 0.64751


 18%|█▊        | 360/2000 [00:36<03:52,  7.07it/s]

Training_loss 2.84378,   Relative Error 0.64607
Training_loss 2.83561,   Relative Error 0.64514


 18%|█▊        | 362/2000 [00:36<03:33,  7.68it/s]

Training_loss 2.82818,   Relative Error 0.64430
Training_loss 2.82204,   Relative Error 0.64361
Training_loss 2.80856,   Relative Error 0.64207


 18%|█▊        | 365/2000 [00:36<03:23,  8.02it/s]

Training_loss 2.80143,   Relative Error 0.64125
Training_loss 2.79848,   Relative Error 0.64090
Training_loss 2.78893,   Relative Error 0.63984


 18%|█▊        | 369/2000 [00:36<02:41, 10.09it/s]

Training_loss 2.78328,   Relative Error 0.63920
Training_loss 2.77830,   Relative Error 0.63866
Training_loss 2.77289,   Relative Error 0.63808


 19%|█▊        | 372/2000 [00:37<02:50,  9.55it/s]

Training_loss 2.76835,   Relative Error 0.63755
Training_loss 2.75664,   Relative Error 0.63618
Training_loss 2.74914,   Relative Error 0.63534


 19%|█▊        | 374/2000 [00:37<02:41, 10.07it/s]

Training_loss 2.74554,   Relative Error 0.63495
Training_loss 2.73940,   Relative Error 0.63426
Training_loss 2.72892,   Relative Error 0.63306


 19%|█▉        | 378/2000 [00:37<02:30, 10.81it/s]

Training_loss 2.72252,   Relative Error 0.63232
Training_loss 2.71582,   Relative Error 0.63155
Training_loss 2.70728,   Relative Error 0.63055


 19%|█▉        | 380/2000 [00:38<02:39, 10.17it/s]

Training_loss 2.70074,   Relative Error 0.62979
Training_loss 2.69702,   Relative Error 0.62934


 19%|█▉        | 382/2000 [00:38<02:37, 10.26it/s]

Training_loss 2.69672,   Relative Error 0.62931
Training_loss 2.68907,   Relative Error 0.62841
Training_loss 2.68136,   Relative Error 0.62747


 19%|█▉        | 386/2000 [00:38<02:31, 10.66it/s]

Training_loss 2.67144,   Relative Error 0.62631
Training_loss 2.66376,   Relative Error 0.62543
Training_loss 2.65922,   Relative Error 0.62489


 19%|█▉        | 388/2000 [00:38<02:31, 10.67it/s]

Training_loss 2.65006,   Relative Error 0.62380
Training_loss 2.64353,   Relative Error 0.62305
Training_loss 2.62901,   Relative Error 0.62137


 20%|█▉        | 392/2000 [00:39<02:24, 11.15it/s]

Training_loss 2.62708,   Relative Error 0.62112
Training_loss 2.61941,   Relative Error 0.62019
Training_loss 2.61652,   Relative Error 0.61984


 20%|█▉        | 394/2000 [00:39<02:25, 11.01it/s]

Training_loss 2.60656,   Relative Error 0.61867
Training_loss 2.60284,   Relative Error 0.61823
Training_loss 2.60014,   Relative Error 0.61793


 20%|█▉        | 398/2000 [00:39<02:21, 11.34it/s]

Training_loss 2.59091,   Relative Error 0.61683
Training_loss 2.58680,   Relative Error 0.61633
Training_loss 2.58292,   Relative Error 0.61587


 20%|██        | 400/2000 [00:39<02:24, 11.05it/s]

Training_loss 2.58144,   Relative Error 0.61568
Training_loss 2.57516,   Relative Error 0.61494
Training_loss 2.56575,   Relative Error 0.61381


 20%|██        | 404/2000 [00:40<02:21, 11.26it/s]

Training_loss 2.55930,   Relative Error 0.61301
Training_loss 2.55011,   Relative Error 0.61193
Training_loss 2.54477,   Relative Error 0.61132


 20%|██        | 406/2000 [00:40<02:19, 11.39it/s]

Training_loss 2.53632,   Relative Error 0.61030
Training_loss 2.53038,   Relative Error 0.60957
Training_loss 2.52169,   Relative Error 0.60851


 20%|██        | 410/2000 [00:40<02:17, 11.58it/s]

Training_loss 2.51648,   Relative Error 0.60790
Training_loss 2.51519,   Relative Error 0.60775
Training_loss 2.50648,   Relative Error 0.60670


 21%|██        | 412/2000 [00:40<02:15, 11.69it/s]

Training_loss 2.50228,   Relative Error 0.60618
Training_loss 2.49824,   Relative Error 0.60569
Training_loss 2.49197,   Relative Error 0.60492


 21%|██        | 416/2000 [00:41<02:12, 12.00it/s]

Training_loss 2.49085,   Relative Error 0.60478
Training_loss 2.48180,   Relative Error 0.60364
Training_loss 2.46874,   Relative Error 0.60207


 21%|██        | 418/2000 [00:41<02:18, 11.42it/s]

Training_loss 2.46548,   Relative Error 0.60171
Training_loss 2.45491,   Relative Error 0.60041
Training_loss 2.44776,   Relative Error 0.59954


 21%|██        | 422/2000 [00:41<02:16, 11.52it/s]

Training_loss 2.43680,   Relative Error 0.59826
Training_loss 2.43196,   Relative Error 0.59768
Training_loss 2.42462,   Relative Error 0.59675


 21%|██        | 424/2000 [00:41<02:17, 11.45it/s]

Training_loss 2.42066,   Relative Error 0.59624
Training_loss 2.41228,   Relative Error 0.59517
Training_loss 2.40239,   Relative Error 0.59396


 21%|██▏       | 428/2000 [00:42<02:13, 11.81it/s]

Training_loss 2.40029,   Relative Error 0.59371
Training_loss 2.39457,   Relative Error 0.59298
Training_loss 2.39094,   Relative Error 0.59255


 22%|██▏       | 430/2000 [00:42<02:13, 11.73it/s]

Training_loss 2.38744,   Relative Error 0.59212
Training_loss 2.37805,   Relative Error 0.59092
Training_loss 2.37377,   Relative Error 0.59040


 22%|██▏       | 434/2000 [00:42<02:15, 11.54it/s]

Training_loss 2.36393,   Relative Error 0.58919
Training_loss 2.35392,   Relative Error 0.58797
Training_loss 2.34927,   Relative Error 0.58736


 22%|██▏       | 436/2000 [00:42<02:14, 11.67it/s]

Training_loss 2.34265,   Relative Error 0.58651
Training_loss 2.33869,   Relative Error 0.58602


 22%|██▏       | 438/2000 [00:43<02:30, 10.36it/s]

Training_loss 2.33439,   Relative Error 0.58548
Training_loss 2.32941,   Relative Error 0.58485
Training_loss 2.32400,   Relative Error 0.58418


 22%|██▏       | 440/2000 [00:43<02:26, 10.63it/s]

Training_loss 2.32264,   Relative Error 0.58400
Training_loss 2.31366,   Relative Error 0.58289


 22%|██▏       | 444/2000 [00:43<02:22, 10.91it/s]

Training_loss 2.31021,   Relative Error 0.58246
Training_loss 2.30200,   Relative Error 0.58141
Training_loss 2.29352,   Relative Error 0.58034


 22%|██▏       | 446/2000 [00:43<02:17, 11.34it/s]

Training_loss 2.29054,   Relative Error 0.57998
Training_loss 2.28619,   Relative Error 0.57941
Training_loss 2.28312,   Relative Error 0.57902


 22%|██▎       | 450/2000 [00:44<02:12, 11.66it/s]

Training_loss 2.27735,   Relative Error 0.57827
Training_loss 2.27177,   Relative Error 0.57758
Training_loss 2.26848,   Relative Error 0.57715


 23%|██▎       | 452/2000 [00:44<02:13, 11.62it/s]

Training_loss 2.26622,   Relative Error 0.57687
Training_loss 2.26123,   Relative Error 0.57620
Training_loss 2.25594,   Relative Error 0.57553


 23%|██▎       | 454/2000 [00:44<02:23, 10.79it/s]

Training_loss 2.24786,   Relative Error 0.57446
Training_loss 2.24354,   Relative Error 0.57391


 23%|██▎       | 456/2000 [00:44<02:26, 10.51it/s]

Training_loss 2.23966,   Relative Error 0.57342
Training_loss 2.23450,   Relative Error 0.57276


 23%|██▎       | 460/2000 [00:45<02:30, 10.20it/s]

Training_loss 2.22734,   Relative Error 0.57181
Training_loss 2.21915,   Relative Error 0.57077
Training_loss 2.21317,   Relative Error 0.57000


 23%|██▎       | 462/2000 [00:45<02:27, 10.42it/s]

Training_loss 2.20489,   Relative Error 0.56891
Training_loss 2.19737,   Relative Error 0.56792
Training_loss 2.18765,   Relative Error 0.56668


 23%|██▎       | 466/2000 [00:45<02:25, 10.54it/s]

Training_loss 2.17748,   Relative Error 0.56540
Training_loss 2.17048,   Relative Error 0.56449
Training_loss 2.16728,   Relative Error 0.56409


 23%|██▎       | 468/2000 [00:46<02:30, 10.19it/s]

Training_loss 2.16386,   Relative Error 0.56364
Training_loss 2.15661,   Relative Error 0.56268


 24%|██▎       | 470/2000 [00:46<02:28, 10.29it/s]

Training_loss 2.15195,   Relative Error 0.56209
Training_loss 2.14270,   Relative Error 0.56088
Training_loss 2.13616,   Relative Error 0.56006


 24%|██▎       | 474/2000 [00:46<02:19, 10.92it/s]

Training_loss 2.13312,   Relative Error 0.55965
Training_loss 2.12935,   Relative Error 0.55913
Training_loss 2.12797,   Relative Error 0.55895


 24%|██▍       | 476/2000 [00:46<02:16, 11.20it/s]

Training_loss 2.12340,   Relative Error 0.55834
Training_loss 2.11478,   Relative Error 0.55722
Training_loss 2.10794,   Relative Error 0.55635


 24%|██▍       | 480/2000 [00:47<02:12, 11.43it/s]

Training_loss 2.10486,   Relative Error 0.55595
Training_loss 2.10228,   Relative Error 0.55562
Training_loss 2.09975,   Relative Error 0.55530


 24%|██▍       | 482/2000 [00:47<02:15, 11.17it/s]

Training_loss 2.09610,   Relative Error 0.55482
Training_loss 2.09187,   Relative Error 0.55426
Training_loss 2.08658,   Relative Error 0.55354


 24%|██▍       | 486/2000 [00:47<02:10, 11.56it/s]

Training_loss 2.07983,   Relative Error 0.55263
Training_loss 2.07787,   Relative Error 0.55239
Training_loss 2.07365,   Relative Error 0.55181


 24%|██▍       | 488/2000 [00:47<02:13, 11.33it/s]

Training_loss 2.07248,   Relative Error 0.55165
Training_loss 2.07065,   Relative Error 0.55140
Training_loss 2.06698,   Relative Error 0.55092


 24%|██▍       | 490/2000 [00:47<02:09, 11.66it/s]

Training_loss 2.06243,   Relative Error 0.55032


 25%|██▍       | 492/2000 [00:48<03:00,  8.36it/s]

Training_loss 2.06041,   Relative Error 0.55003
Training_loss 2.05418,   Relative Error 0.54920
Training_loss 2.04680,   Relative Error 0.54821


 25%|██▍       | 496/2000 [00:48<02:34,  9.72it/s]

Training_loss 2.04564,   Relative Error 0.54805
Training_loss 2.03846,   Relative Error 0.54709
Training_loss 2.03125,   Relative Error 0.54611


 25%|██▍       | 498/2000 [00:48<02:25, 10.33it/s]

Training_loss 2.02711,   Relative Error 0.54556
Training_loss 2.02485,   Relative Error 0.54526
Training_loss 2.02327,   Relative Error 0.54504


 25%|██▌       | 502/2000 [00:49<02:13, 11.20it/s]

Training_loss 2.01972,   Relative Error 0.54454
Training_loss 2.01109,   Relative Error 0.54342
Training_loss 2.00685,   Relative Error 0.54284


 25%|██▌       | 504/2000 [00:49<02:10, 11.44it/s]

Training_loss 2.00431,   Relative Error 0.54248
Training_loss 2.00254,   Relative Error 0.54221
Training_loss 1.99544,   Relative Error 0.54128


 25%|██▌       | 508/2000 [00:49<02:01, 12.31it/s]

Training_loss 1.99421,   Relative Error 0.54107
Training_loss 1.99175,   Relative Error 0.54075
Training_loss 1.98665,   Relative Error 0.54006


 26%|██▌       | 510/2000 [00:49<02:05, 11.84it/s]

Training_loss 1.98189,   Relative Error 0.53939
Training_loss 1.97920,   Relative Error 0.53904
Training_loss 1.97692,   Relative Error 0.53875


 26%|██▌       | 514/2000 [00:50<02:11, 11.28it/s]

Training_loss 1.97333,   Relative Error 0.53823
Training_loss 1.97151,   Relative Error 0.53798
Training_loss 1.96447,   Relative Error 0.53704


 26%|██▌       | 516/2000 [00:50<02:12, 11.24it/s]

Training_loss 1.96248,   Relative Error 0.53677
Training_loss 1.95877,   Relative Error 0.53626
Training_loss 1.95481,   Relative Error 0.53574


 26%|██▌       | 520/2000 [00:50<02:03, 12.01it/s]

Training_loss 1.95111,   Relative Error 0.53523
Training_loss 1.94626,   Relative Error 0.53456
Training_loss 1.94204,   Relative Error 0.53398


 26%|██▌       | 522/2000 [00:50<02:11, 11.26it/s]

Training_loss 1.93826,   Relative Error 0.53347
Training_loss 1.93648,   Relative Error 0.53320
Training_loss 1.92910,   Relative Error 0.53223


 26%|██▋       | 526/2000 [00:51<02:08, 11.43it/s]

Training_loss 1.92805,   Relative Error 0.53207
Training_loss 1.92081,   Relative Error 0.53107
Training_loss 1.91861,   Relative Error 0.53078


 26%|██▋       | 528/2000 [00:51<02:03, 11.92it/s]

Training_loss 1.91123,   Relative Error 0.52979
Training_loss 1.91021,   Relative Error 0.52963
Training_loss 1.90753,   Relative Error 0.52928


 26%|██▋       | 530/2000 [00:51<02:13, 11.04it/s]

Training_loss 1.90202,   Relative Error 0.52853
Training_loss 1.90128,   Relative Error 0.52843


 27%|██▋       | 532/2000 [00:51<02:24, 10.16it/s]

Training_loss 1.89980,   Relative Error 0.52822
Training_loss 1.89825,   Relative Error 0.52801


 27%|██▋       | 535/2000 [00:52<02:53,  8.44it/s]

Training_loss 1.89231,   Relative Error 0.52718
Training_loss 1.88890,   Relative Error 0.52673


 27%|██▋       | 537/2000 [00:52<03:00,  8.12it/s]

Training_loss 1.88290,   Relative Error 0.52592
Training_loss 1.87979,   Relative Error 0.52548


 27%|██▋       | 539/2000 [00:52<02:37,  9.29it/s]

Training_loss 1.87490,   Relative Error 0.52479
Training_loss 1.86673,   Relative Error 0.52364
Training_loss 1.86527,   Relative Error 0.52341


 27%|██▋       | 543/2000 [00:53<02:15, 10.79it/s]

Training_loss 1.86234,   Relative Error 0.52300
Training_loss 1.85554,   Relative Error 0.52205
Training_loss 1.85340,   Relative Error 0.52175


 27%|██▋       | 545/2000 [00:53<02:12, 10.99it/s]

Training_loss 1.84975,   Relative Error 0.52125
Training_loss 1.84774,   Relative Error 0.52099
Training_loss 1.84531,   Relative Error 0.52066


 27%|██▋       | 549/2000 [00:53<02:01, 11.93it/s]

Training_loss 1.84173,   Relative Error 0.52018
Training_loss 1.83896,   Relative Error 0.51978
Training_loss 1.83790,   Relative Error 0.51962


 28%|██▊       | 551/2000 [00:53<01:59, 12.08it/s]

Training_loss 1.83293,   Relative Error 0.51888
Training_loss 1.82871,   Relative Error 0.51828
Training_loss 1.82815,   Relative Error 0.51822


 28%|██▊       | 555/2000 [00:54<01:56, 12.44it/s]

Training_loss 1.82342,   Relative Error 0.51755
Training_loss 1.82059,   Relative Error 0.51712
Training_loss 1.81665,   Relative Error 0.51657


 28%|██▊       | 557/2000 [00:54<02:01, 11.85it/s]

Training_loss 1.81415,   Relative Error 0.51621
Training_loss 1.80684,   Relative Error 0.51519
Training_loss 1.80600,   Relative Error 0.51506


 28%|██▊       | 561/2000 [00:54<01:56, 12.37it/s]

Training_loss 1.79926,   Relative Error 0.51410
Training_loss 1.79790,   Relative Error 0.51391
Training_loss 1.79259,   Relative Error 0.51318


 28%|██▊       | 563/2000 [00:54<01:55, 12.47it/s]

Training_loss 1.79062,   Relative Error 0.51289
Training_loss 1.79107,   Relative Error 0.51296
Training_loss 1.79032,   Relative Error 0.51284


 28%|██▊       | 567/2000 [00:54<01:54, 12.47it/s]

Training_loss 1.78485,   Relative Error 0.51208
Training_loss 1.78205,   Relative Error 0.51168
Training_loss 1.77954,   Relative Error 0.51134


 28%|██▊       | 569/2000 [00:55<01:55, 12.44it/s]

Training_loss 1.77835,   Relative Error 0.51115
Training_loss 1.77066,   Relative Error 0.51002
Training_loss 1.76847,   Relative Error 0.50975


 29%|██▊       | 573/2000 [00:55<02:17, 10.41it/s]

Training_loss 1.76183,   Relative Error 0.50879
Training_loss 1.75591,   Relative Error 0.50795
Training_loss 1.75139,   Relative Error 0.50731


 29%|██▉       | 575/2000 [00:55<02:10, 10.90it/s]

Training_loss 1.74963,   Relative Error 0.50706
Training_loss 1.74571,   Relative Error 0.50649
Training_loss 1.74120,   Relative Error 0.50585


 29%|██▉       | 579/2000 [00:56<02:03, 11.47it/s]

Training_loss 1.74012,   Relative Error 0.50570
Training_loss 1.73771,   Relative Error 0.50535
Training_loss 1.73495,   Relative Error 0.50497


 29%|██▉       | 581/2000 [00:56<02:11, 10.76it/s]

Training_loss 1.73392,   Relative Error 0.50480
Training_loss 1.72860,   Relative Error 0.50404
Training_loss 1.72749,   Relative Error 0.50388


 29%|██▉       | 583/2000 [00:56<02:05, 11.25it/s]

Training_loss 1.72597,   Relative Error 0.50367
Training_loss 1.72321,   Relative Error 0.50327


 29%|██▉       | 587/2000 [00:56<02:25,  9.69it/s]

Training_loss 1.71833,   Relative Error 0.50256
Training_loss 1.71526,   Relative Error 0.50212
Training_loss 1.71163,   Relative Error 0.50160


 29%|██▉       | 589/2000 [00:57<02:36,  9.03it/s]

Training_loss 1.71218,   Relative Error 0.50168
Training_loss 1.71056,   Relative Error 0.50145


 30%|██▉       | 592/2000 [00:57<02:26,  9.61it/s]

Training_loss 1.70632,   Relative Error 0.50080
Training_loss 1.70264,   Relative Error 0.50025
Training_loss 1.69800,   Relative Error 0.49956


 30%|██▉       | 594/2000 [00:57<02:22,  9.86it/s]

Training_loss 1.69936,   Relative Error 0.49975
Training_loss 1.69448,   Relative Error 0.49905
Training_loss 1.69232,   Relative Error 0.49872


 30%|██▉       | 596/2000 [00:57<02:15, 10.37it/s]

Training_loss 1.68863,   Relative Error 0.49819
Training_loss 1.68660,   Relative Error 0.49789


 30%|██▉       | 598/2000 [00:58<02:20, 10.00it/s]

Training_loss 1.68546,   Relative Error 0.49770
Training_loss 1.68236,   Relative Error 0.49723


 30%|███       | 601/2000 [00:58<03:59,  5.83it/s]

Training_loss 1.67706,   Relative Error 0.49644
Training_loss 1.67233,   Relative Error 0.49574


 30%|███       | 603/2000 [00:59<03:19,  6.99it/s]

Training_loss 1.67033,   Relative Error 0.49544
Training_loss 1.66683,   Relative Error 0.49494
Training_loss 1.66398,   Relative Error 0.49453


 30%|███       | 607/2000 [00:59<02:35,  8.94it/s]

Training_loss 1.66169,   Relative Error 0.49420
Training_loss 1.66106,   Relative Error 0.49409
Training_loss 1.66019,   Relative Error 0.49398


 30%|███       | 609/2000 [00:59<02:28,  9.34it/s]

Training_loss 1.65889,   Relative Error 0.49378
Training_loss 1.65837,   Relative Error 0.49368


 31%|███       | 611/2000 [00:59<02:27,  9.45it/s]

Training_loss 1.65526,   Relative Error 0.49323
Training_loss 1.65492,   Relative Error 0.49318
Training_loss 1.65062,   Relative Error 0.49254


 31%|███       | 615/2000 [01:00<02:11, 10.51it/s]

Training_loss 1.65030,   Relative Error 0.49250
Training_loss 1.64849,   Relative Error 0.49224
Training_loss 1.64240,   Relative Error 0.49133


 31%|███       | 617/2000 [01:00<02:08, 10.72it/s]

Training_loss 1.63990,   Relative Error 0.49096
Training_loss 1.63496,   Relative Error 0.49023
Training_loss 1.62867,   Relative Error 0.48930


 31%|███       | 621/2000 [01:00<02:01, 11.32it/s]

Training_loss 1.62562,   Relative Error 0.48883
Training_loss 1.62313,   Relative Error 0.48846
Training_loss 1.62283,   Relative Error 0.48841


 31%|███       | 623/2000 [01:00<02:09, 10.65it/s]

Training_loss 1.62229,   Relative Error 0.48834
Training_loss 1.62110,   Relative Error 0.48818
Training_loss 1.61870,   Relative Error 0.48779


 31%|███▏      | 627/2000 [01:01<02:03, 11.08it/s]

Training_loss 1.61586,   Relative Error 0.48736
Training_loss 1.61361,   Relative Error 0.48702
Training_loss 1.61358,   Relative Error 0.48704
Training_loss 1.61317,   Relative Error 0.48698


 31%|███▏      | 629/2000 [01:01<02:47,  8.19it/s]

Training_loss 1.61315,   Relative Error 0.48697


 32%|███▏      | 631/2000 [01:02<03:41,  6.18it/s]

Training_loss 1.61240,   Relative Error 0.48688
Training_loss 1.61202,   Relative Error 0.48682


 32%|███▏      | 633/2000 [01:02<03:17,  6.92it/s]

Training_loss 1.61018,   Relative Error 0.48651
Training_loss 1.60643,   Relative Error 0.48597


 32%|███▏      | 634/2000 [01:02<03:26,  6.62it/s]

Training_loss 1.60601,   Relative Error 0.48588
Training_loss 1.60327,   Relative Error 0.48546

 32%|███▏      | 635/2000 [01:02<03:42,  6.14it/s]




 32%|███▏      | 636/2000 [01:03<04:36,  4.94it/s]

Training_loss 1.60054,   Relative Error 0.48506


 32%|███▏      | 637/2000 [01:03<04:52,  4.66it/s]

Training_loss 1.59956,   Relative Error 0.48491
Training_loss 1.59747,   Relative Error 0.48460


 32%|███▏      | 639/2000 [01:03<03:52,  5.86it/s]

Training_loss 1.59764,   Relative Error 0.48463


 32%|███▏      | 640/2000 [01:03<04:13,  5.36it/s]

Training_loss 1.59702,   Relative Error 0.48454


 32%|███▏      | 642/2000 [01:04<04:14,  5.34it/s]

Training_loss 1.59302,   Relative Error 0.48392
Training_loss 1.59296,   Relative Error 0.48390


 32%|███▏      | 643/2000 [01:04<04:47,  4.71it/s]

Training_loss 1.59167,   Relative Error 0.48369


 32%|███▏      | 644/2000 [01:04<05:28,  4.13it/s]

Training_loss 1.59100,   Relative Error 0.48359


 32%|███▏      | 645/2000 [01:05<05:26,  4.15it/s]

Training_loss 1.58943,   Relative Error 0.48334
Training_loss 1.58693,   Relative Error 0.48296


 32%|███▏      | 648/2000 [01:05<04:17,  5.24it/s]

Training_loss 1.58601,   Relative Error 0.48281
Training_loss 1.58307,   Relative Error 0.48236


 32%|███▎      | 650/2000 [01:05<03:35,  6.27it/s]

Training_loss 1.57816,   Relative Error 0.48164
Training_loss 1.57329,   Relative Error 0.48091


 33%|███▎      | 652/2000 [01:06<03:23,  6.61it/s]

Training_loss 1.56960,   Relative Error 0.48037
Training_loss 1.57028,   Relative Error 0.48047


 33%|███▎      | 654/2000 [01:06<03:12,  6.98it/s]

Training_loss 1.56613,   Relative Error 0.47985
Training_loss 1.56534,   Relative Error 0.47976


 33%|███▎      | 656/2000 [01:06<03:31,  6.37it/s]

Training_loss 1.56163,   Relative Error 0.47921
Training_loss 1.55969,   Relative Error 0.47891


 33%|███▎      | 658/2000 [01:06<03:10,  7.05it/s]

Training_loss 1.55874,   Relative Error 0.47875
Training_loss 1.55794,   Relative Error 0.47863


 33%|███▎      | 660/2000 [01:07<02:35,  8.59it/s]

Training_loss 1.55628,   Relative Error 0.47838
Training_loss 1.55448,   Relative Error 0.47811
Training_loss 1.55597,   Relative Error 0.47833


 33%|███▎      | 663/2000 [01:07<02:21,  9.44it/s]

Training_loss 1.55474,   Relative Error 0.47815
Training_loss 1.55332,   Relative Error 0.47794


 33%|███▎      | 665/2000 [01:07<02:43,  8.19it/s]

Training_loss 1.55195,   Relative Error 0.47773
Training_loss 1.54900,   Relative Error 0.47731


 33%|███▎      | 668/2000 [01:07<02:19,  9.58it/s]

Training_loss 1.54474,   Relative Error 0.47663
Training_loss 1.54379,   Relative Error 0.47649
Training_loss 1.54093,   Relative Error 0.47604


 34%|███▎      | 670/2000 [01:08<02:38,  8.40it/s]

Training_loss 1.53847,   Relative Error 0.47565
Training_loss 1.53781,   Relative Error 0.47556


 34%|███▎      | 672/2000 [01:08<02:52,  7.70it/s]

Training_loss 1.53654,   Relative Error 0.47538
Training_loss 1.53210,   Relative Error 0.47469


 34%|███▎      | 674/2000 [01:08<02:58,  7.44it/s]

Training_loss 1.53240,   Relative Error 0.47473
Training_loss 1.53340,   Relative Error 0.47489


 34%|███▍      | 676/2000 [01:09<02:37,  8.42it/s]

Training_loss 1.53149,   Relative Error 0.47459
Training_loss 1.53272,   Relative Error 0.47477


 34%|███▍      | 678/2000 [01:09<02:34,  8.58it/s]

Training_loss 1.52856,   Relative Error 0.47413
Training_loss 1.52835,   Relative Error 0.47411


 34%|███▍      | 680/2000 [01:09<02:25,  9.05it/s]

Training_loss 1.52779,   Relative Error 0.47403
Training_loss 1.52607,   Relative Error 0.47374


 34%|███▍      | 682/2000 [01:09<02:55,  7.52it/s]

Training_loss 1.52564,   Relative Error 0.47368
Training_loss 1.52242,   Relative Error 0.47319


 34%|███▍      | 684/2000 [01:09<02:50,  7.72it/s]

Training_loss 1.52358,   Relative Error 0.47336
Training_loss 1.52263,   Relative Error 0.47320


 34%|███▍      | 686/2000 [01:10<02:21,  9.26it/s]

Training_loss 1.52235,   Relative Error 0.47315
Training_loss 1.52137,   Relative Error 0.47300
Training_loss 1.52031,   Relative Error 0.47284


 34%|███▍      | 690/2000 [01:10<01:57, 11.15it/s]

Training_loss 1.51589,   Relative Error 0.47215
Training_loss 1.51511,   Relative Error 0.47203
Training_loss 1.51228,   Relative Error 0.47161


 35%|███▍      | 692/2000 [01:10<01:55, 11.33it/s]

Training_loss 1.51118,   Relative Error 0.47142
Training_loss 1.51028,   Relative Error 0.47126
Training_loss 1.50586,   Relative Error 0.47057


 35%|███▍      | 696/2000 [01:10<01:51, 11.67it/s]

Training_loss 1.50259,   Relative Error 0.47005
Training_loss 1.49925,   Relative Error 0.46952
Training_loss 1.49803,   Relative Error 0.46933


 35%|███▍      | 698/2000 [01:11<01:48, 11.95it/s]

Training_loss 1.49377,   Relative Error 0.46866
Training_loss 1.49086,   Relative Error 0.46821
Training_loss 1.48908,   Relative Error 0.46792


 35%|███▌      | 702/2000 [01:11<01:48, 11.98it/s]

Training_loss 1.48650,   Relative Error 0.46750
Training_loss 1.48636,   Relative Error 0.46749
Training_loss 1.48392,   Relative Error 0.46710


 35%|███▌      | 704/2000 [01:11<01:52, 11.56it/s]

Training_loss 1.48405,   Relative Error 0.46713
Training_loss 1.48308,   Relative Error 0.46700


 35%|███▌      | 706/2000 [01:11<02:09,  9.96it/s]

Training_loss 1.48322,   Relative Error 0.46702
Training_loss 1.47907,   Relative Error 0.46637
Training_loss 1.47601,   Relative Error 0.46588


 36%|███▌      | 710/2000 [01:12<02:00, 10.74it/s]

Training_loss 1.47477,   Relative Error 0.46566
Training_loss 1.47345,   Relative Error 0.46544
Training_loss 1.47396,   Relative Error 0.46552


 36%|███▌      | 712/2000 [01:12<01:59, 10.75it/s]

Training_loss 1.47198,   Relative Error 0.46522
Training_loss 1.47064,   Relative Error 0.46500
Training_loss 1.46830,   Relative Error 0.46463


 36%|███▌      | 716/2000 [01:12<01:56, 11.05it/s]

Training_loss 1.46460,   Relative Error 0.46403
Training_loss 1.46463,   Relative Error 0.46403
Training_loss 1.46307,   Relative Error 0.46379


 36%|███▌      | 718/2000 [01:12<01:52, 11.44it/s]

Training_loss 1.46085,   Relative Error 0.46343
Training_loss 1.45936,   Relative Error 0.46319
Training_loss 1.46019,   Relative Error 0.46331


 36%|███▌      | 720/2000 [01:13<01:48, 11.77it/s]

Training_loss 1.45650,   Relative Error 0.46273
Training_loss 1.45620,   Relative Error 0.46267


 36%|███▌      | 724/2000 [01:13<02:07, 10.03it/s]

Training_loss 1.45734,   Relative Error 0.46284
Training_loss 1.45345,   Relative Error 0.46224
Training_loss 1.45281,   Relative Error 0.46213
Training_loss 1.45052,   Relative Error 0.46176
Training_loss 1.44839,   Relative Error 0.46143


 36%|███▋      | 728/2000 [01:14<02:51,  7.42it/s]

Training_loss 1.44746,   Relative Error 0.46129
Training_loss 1.44729,   Relative Error 0.46128
Training_loss 1.44637,   Relative Error 0.46113


 37%|███▋      | 732/2000 [01:14<02:09,  9.82it/s]

Training_loss 1.44274,   Relative Error 0.46055
Training_loss 1.44045,   Relative Error 0.46020
Training_loss 1.44034,   Relative Error 0.46018


 37%|███▋      | 734/2000 [01:14<02:10,  9.67it/s]

Training_loss 1.44138,   Relative Error 0.46033
Training_loss 1.44247,   Relative Error 0.46050


 37%|███▋      | 736/2000 [01:14<02:09,  9.75it/s]

Training_loss 1.44236,   Relative Error 0.46047
Training_loss 1.44335,   Relative Error 0.46062
Training_loss 1.44143,   Relative Error 0.46033


 37%|███▋      | 740/2000 [01:15<01:55, 10.87it/s]

Training_loss 1.43935,   Relative Error 0.45998
Training_loss 1.44065,   Relative Error 0.46019
Training_loss 1.44044,   Relative Error 0.46016


 37%|███▋      | 742/2000 [01:15<02:28,  8.45it/s]

Training_loss 1.43850,   Relative Error 0.45985
Training_loss 1.43880,   Relative Error 0.45990


 37%|███▋      | 744/2000 [01:15<02:43,  7.68it/s]

Training_loss 1.43782,   Relative Error 0.45974
Training_loss 1.43669,   Relative Error 0.45957


 37%|███▋      | 747/2000 [01:16<02:25,  8.63it/s]

Training_loss 1.43573,   Relative Error 0.45942
Training_loss 1.43537,   Relative Error 0.45935
Training_loss 1.43465,   Relative Error 0.45923


 37%|███▋      | 749/2000 [01:16<02:08,  9.76it/s]

Training_loss 1.43547,   Relative Error 0.45936
Training_loss 1.43582,   Relative Error 0.45942
Training_loss 1.43224,   Relative Error 0.45885


 38%|███▊      | 753/2000 [01:16<01:54, 10.93it/s]

Training_loss 1.43166,   Relative Error 0.45875
Training_loss 1.43288,   Relative Error 0.45894
Training_loss 1.43282,   Relative Error 0.45895


 38%|███▊      | 755/2000 [01:16<01:50, 11.24it/s]

Training_loss 1.43414,   Relative Error 0.45914
Training_loss 1.43365,   Relative Error 0.45906
Training_loss 1.43379,   Relative Error 0.45908


 38%|███▊      | 759/2000 [01:17<01:45, 11.76it/s]

Training_loss 1.43010,   Relative Error 0.45848
Training_loss 1.43148,   Relative Error 0.45870
Training_loss 1.43069,   Relative Error 0.45857


 38%|███▊      | 761/2000 [01:17<01:50, 11.20it/s]

Training_loss 1.42966,   Relative Error 0.45842
Training_loss 1.42677,   Relative Error 0.45794


 38%|███▊      | 763/2000 [01:17<01:54, 10.79it/s]

Training_loss 1.42677,   Relative Error 0.45794
Training_loss 1.42612,   Relative Error 0.45784
Training_loss 1.42584,   Relative Error 0.45778


 38%|███▊      | 767/2000 [01:18<01:53, 10.88it/s]

Training_loss 1.42540,   Relative Error 0.45770
Training_loss 1.42515,   Relative Error 0.45767
Training_loss 1.42156,   Relative Error 0.45709


 38%|███▊      | 769/2000 [01:18<01:55, 10.67it/s]

Training_loss 1.41874,   Relative Error 0.45663
Training_loss 1.41972,   Relative Error 0.45679
Training_loss 1.41680,   Relative Error 0.45631


 39%|███▊      | 773/2000 [01:18<01:51, 10.98it/s]

Training_loss 1.41671,   Relative Error 0.45631
Training_loss 1.41578,   Relative Error 0.45614
Training_loss 1.41496,   Relative Error 0.45601


 39%|███▉      | 775/2000 [01:18<01:47, 11.38it/s]

Training_loss 1.41153,   Relative Error 0.45547
Training_loss 1.40914,   Relative Error 0.45510
Training_loss 1.40927,   Relative Error 0.45511


 39%|███▉      | 779/2000 [01:19<01:38, 12.43it/s]

Training_loss 1.40838,   Relative Error 0.45495
Training_loss 1.41005,   Relative Error 0.45524
Training_loss 1.41010,   Relative Error 0.45525


 39%|███▉      | 781/2000 [01:19<01:37, 12.50it/s]

Training_loss 1.40956,   Relative Error 0.45518
Training_loss 1.40916,   Relative Error 0.45512
Training_loss 1.40879,   Relative Error 0.45505


 39%|███▉      | 783/2000 [01:19<01:37, 12.50it/s]

Training_loss 1.40935,   Relative Error 0.45513
Training_loss 1.41043,   Relative Error 0.45530


 39%|███▉      | 787/2000 [01:19<01:56, 10.44it/s]

Training_loss 1.40714,   Relative Error 0.45479
Training_loss 1.40905,   Relative Error 0.45509
Training_loss 1.40930,   Relative Error 0.45513


 39%|███▉      | 789/2000 [01:20<02:05,  9.68it/s]

Training_loss 1.40934,   Relative Error 0.45515
Training_loss 1.40936,   Relative Error 0.45516


 40%|███▉      | 791/2000 [01:20<01:58, 10.16it/s]

Training_loss 1.40820,   Relative Error 0.45498
Training_loss 1.40822,   Relative Error 0.45498
Training_loss 1.40769,   Relative Error 0.45489


 40%|███▉      | 793/2000 [01:20<01:58, 10.19it/s]

Training_loss 1.40792,   Relative Error 0.45492
Training_loss 1.40877,   Relative Error 0.45506


 40%|███▉      | 796/2000 [01:20<02:14,  8.93it/s]

Training_loss 1.40923,   Relative Error 0.45513
Training_loss 1.40589,   Relative Error 0.45460


 40%|███▉      | 799/2000 [01:21<02:00,  9.95it/s]

Training_loss 1.40593,   Relative Error 0.45460
Training_loss 1.40637,   Relative Error 0.45467
Training_loss 1.40270,   Relative Error 0.45409


 40%|████      | 801/2000 [01:21<01:50, 10.86it/s]

Training_loss 1.40342,   Relative Error 0.45421
Training_loss 1.40221,   Relative Error 0.45400
Training_loss 1.40063,   Relative Error 0.45374


 40%|████      | 805/2000 [01:21<01:39, 11.96it/s]

Training_loss 1.39808,   Relative Error 0.45331
Training_loss 1.39813,   Relative Error 0.45332
Training_loss 1.39934,   Relative Error 0.45350


 40%|████      | 807/2000 [01:21<01:39, 12.05it/s]

Training_loss 1.39965,   Relative Error 0.45358
Training_loss 1.39709,   Relative Error 0.45316
Training_loss 1.39753,   Relative Error 0.45323


 41%|████      | 811/2000 [01:22<01:36, 12.31it/s]

Training_loss 1.39740,   Relative Error 0.45320
Training_loss 1.39736,   Relative Error 0.45318
Training_loss 1.39414,   Relative Error 0.45265


 41%|████      | 813/2000 [01:22<01:36, 12.24it/s]

Training_loss 1.39267,   Relative Error 0.45242
Training_loss 1.39216,   Relative Error 0.45233
Training_loss 1.39241,   Relative Error 0.45237


 41%|████      | 817/2000 [01:22<01:34, 12.47it/s]

Training_loss 1.38985,   Relative Error 0.45196
Training_loss 1.38925,   Relative Error 0.45186
Training_loss 1.38774,   Relative Error 0.45160


 41%|████      | 819/2000 [01:22<01:36, 12.26it/s]

Training_loss 1.38798,   Relative Error 0.45163
Training_loss 1.38866,   Relative Error 0.45174
Training_loss 1.38824,   Relative Error 0.45166


 41%|████      | 823/2000 [01:23<01:44, 11.27it/s]

Training_loss 1.38721,   Relative Error 0.45149
Training_loss 1.38405,   Relative Error 0.45100
Training_loss 1.38454,   Relative Error 0.45109


 41%|████▏     | 825/2000 [01:23<01:46, 11.05it/s]

Training_loss 1.38366,   Relative Error 0.45095
Training_loss 1.38278,   Relative Error 0.45081
Training_loss 1.38231,   Relative Error 0.45073


 41%|████▏     | 829/2000 [01:23<01:47, 10.90it/s]

Training_loss 1.38076,   Relative Error 0.45047
Training_loss 1.37910,   Relative Error 0.45018
Training_loss 1.37799,   Relative Error 0.45000


 42%|████▏     | 831/2000 [01:23<01:48, 10.74it/s]

Training_loss 1.37738,   Relative Error 0.44991
Training_loss 1.37700,   Relative Error 0.44986
Training_loss 1.37646,   Relative Error 0.44977


 42%|████▏     | 835/2000 [01:24<01:40, 11.65it/s]

Training_loss 1.37619,   Relative Error 0.44970
Training_loss 1.37759,   Relative Error 0.44994
Training_loss 1.37711,   Relative Error 0.44983


 42%|████▏     | 837/2000 [01:24<01:38, 11.82it/s]

Training_loss 1.37700,   Relative Error 0.44980
Training_loss 1.37736,   Relative Error 0.44983
Training_loss 1.37850,   Relative Error 0.45002


 42%|████▏     | 841/2000 [01:24<01:35, 12.12it/s]

Training_loss 1.38018,   Relative Error 0.45029
Training_loss 1.38081,   Relative Error 0.45040
Training_loss 1.38144,   Relative Error 0.45050


 42%|████▏     | 843/2000 [01:24<01:39, 11.57it/s]

Training_loss 1.38330,   Relative Error 0.45080
Training_loss 1.38248,   Relative Error 0.45069
Training_loss 1.38033,   Relative Error 0.45032


 42%|████▏     | 847/2000 [01:25<01:36, 12.01it/s]

Training_loss 1.37927,   Relative Error 0.45014
Training_loss 1.37980,   Relative Error 0.45024
Training_loss 1.37743,   Relative Error 0.44983


 42%|████▏     | 849/2000 [01:25<01:33, 12.36it/s]

Training_loss 1.37646,   Relative Error 0.44967
Training_loss 1.37695,   Relative Error 0.44974
Training_loss 1.37633,   Relative Error 0.44966


 43%|████▎     | 853/2000 [01:25<01:38, 11.60it/s]

Training_loss 1.37822,   Relative Error 0.44998
Training_loss 1.37622,   Relative Error 0.44966
Training_loss 1.37635,   Relative Error 0.44968


 43%|████▎     | 855/2000 [01:25<01:37, 11.79it/s]

Training_loss 1.37385,   Relative Error 0.44928
Training_loss 1.37233,   Relative Error 0.44904
Training_loss 1.37328,   Relative Error 0.44918


 43%|████▎     | 859/2000 [01:26<01:34, 12.03it/s]

Training_loss 1.37257,   Relative Error 0.44908
Training_loss 1.37160,   Relative Error 0.44892
Training_loss 1.37040,   Relative Error 0.44873


 43%|████▎     | 863/2000 [01:26<01:25, 13.37it/s]

Training_loss 1.36727,   Relative Error 0.44821
Training_loss 1.36634,   Relative Error 0.44807
Training_loss 1.36611,   Relative Error 0.44803
Training_loss 1.36757,   Relative Error 0.44827


 43%|████▎     | 865/2000 [01:26<01:26, 13.12it/s]

Training_loss 1.36763,   Relative Error 0.44828
Training_loss 1.36697,   Relative Error 0.44816
Training_loss 1.36565,   Relative Error 0.44795


 43%|████▎     | 869/2000 [01:26<01:25, 13.16it/s]

Training_loss 1.36525,   Relative Error 0.44786
Training_loss 1.36649,   Relative Error 0.44809
Training_loss 1.36684,   Relative Error 0.44817


 44%|████▎     | 871/2000 [01:27<01:28, 12.74it/s]

Training_loss 1.36599,   Relative Error 0.44803
Training_loss 1.36523,   Relative Error 0.44790
Training_loss 1.36485,   Relative Error 0.44785


 44%|████▍     | 875/2000 [01:27<01:25, 13.12it/s]

Training_loss 1.36481,   Relative Error 0.44783
Training_loss 1.36461,   Relative Error 0.44778
Training_loss 1.36516,   Relative Error 0.44786


 44%|████▍     | 877/2000 [01:27<01:24, 13.22it/s]

Training_loss 1.36533,   Relative Error 0.44788
Training_loss 1.36552,   Relative Error 0.44791
Training_loss 1.36616,   Relative Error 0.44800


 44%|████▍     | 881/2000 [01:27<01:29, 12.44it/s]

Training_loss 1.36504,   Relative Error 0.44782
Training_loss 1.36322,   Relative Error 0.44751
Training_loss 1.36412,   Relative Error 0.44767


 44%|████▍     | 883/2000 [01:27<01:30, 12.33it/s]

Training_loss 1.36465,   Relative Error 0.44775
Training_loss 1.36159,   Relative Error 0.44725
Training_loss 1.36424,   Relative Error 0.44769


 44%|████▍     | 885/2000 [01:28<01:32, 12.12it/s]

Training_loss 1.36240,   Relative Error 0.44737
Training_loss 1.36304,   Relative Error 0.44748


 44%|████▍     | 889/2000 [01:28<01:39, 11.22it/s]

Training_loss 1.36455,   Relative Error 0.44773
Training_loss 1.36415,   Relative Error 0.44765
Training_loss 1.36089,   Relative Error 0.44710


 45%|████▍     | 891/2000 [01:28<01:38, 11.23it/s]

Training_loss 1.35639,   Relative Error 0.44636
Training_loss 1.35884,   Relative Error 0.44676
Training_loss 1.35620,   Relative Error 0.44634


 45%|████▍     | 895/2000 [01:29<01:36, 11.48it/s]

Training_loss 1.35643,   Relative Error 0.44638
Training_loss 1.35755,   Relative Error 0.44657
Training_loss 1.35648,   Relative Error 0.44640


 45%|████▍     | 897/2000 [01:29<01:36, 11.41it/s]

Training_loss 1.35532,   Relative Error 0.44622
Training_loss 1.35576,   Relative Error 0.44630
Training_loss 1.35585,   Relative Error 0.44631


 45%|████▌     | 901/2000 [01:29<01:34, 11.69it/s]

Training_loss 1.35700,   Relative Error 0.44650
Training_loss 1.35788,   Relative Error 0.44664
Training_loss 1.35932,   Relative Error 0.44686


 45%|████▌     | 903/2000 [01:29<01:35, 11.51it/s]

Training_loss 1.35868,   Relative Error 0.44675
Training_loss 1.35838,   Relative Error 0.44671
Training_loss 1.35805,   Relative Error 0.44665


 45%|████▌     | 907/2000 [01:30<01:36, 11.31it/s]

Training_loss 1.35900,   Relative Error 0.44681
Training_loss 1.36001,   Relative Error 0.44695
Training_loss 1.36121,   Relative Error 0.44716


 45%|████▌     | 909/2000 [01:30<01:41, 10.80it/s]

Training_loss 1.36150,   Relative Error 0.44721
Training_loss 1.36207,   Relative Error 0.44730
Training_loss 1.36372,   Relative Error 0.44757


 46%|████▌     | 913/2000 [01:30<01:29, 12.12it/s]

Training_loss 1.36565,   Relative Error 0.44786
Training_loss 1.36332,   Relative Error 0.44747
Training_loss 1.36387,   Relative Error 0.44757


 46%|████▌     | 915/2000 [01:30<01:52,  9.61it/s]

Training_loss 1.36252,   Relative Error 0.44738
Training_loss 1.36097,   Relative Error 0.44711


 46%|████▌     | 917/2000 [01:31<01:54,  9.45it/s]

Training_loss 1.36146,   Relative Error 0.44720
Training_loss 1.36038,   Relative Error 0.44702
Training_loss 1.36191,   Relative Error 0.44725


 46%|████▌     | 921/2000 [01:31<01:47, 10.00it/s]

Training_loss 1.36506,   Relative Error 0.44776
Training_loss 1.36520,   Relative Error 0.44779
Training_loss 1.36757,   Relative Error 0.44818


 46%|████▌     | 923/2000 [01:31<01:40, 10.68it/s]

Training_loss 1.36689,   Relative Error 0.44808
Training_loss 1.36656,   Relative Error 0.44801
Training_loss 1.36822,   Relative Error 0.44827


 46%|████▋     | 925/2000 [01:31<01:41, 10.64it/s]

Training_loss 1.36914,   Relative Error 0.44841
Training_loss 1.37094,   Relative Error 0.44870


 46%|████▋     | 929/2000 [01:32<01:38, 10.86it/s]

Training_loss 1.37058,   Relative Error 0.44861
Training_loss 1.37230,   Relative Error 0.44888
Training_loss 1.37337,   Relative Error 0.44907


 47%|████▋     | 931/2000 [01:32<01:46, 10.07it/s]

Training_loss 1.37377,   Relative Error 0.44914
Training_loss 1.37269,   Relative Error 0.44895


 47%|████▋     | 933/2000 [01:32<01:52,  9.49it/s]

Training_loss 1.37417,   Relative Error 0.44918
Training_loss 1.37409,   Relative Error 0.44918
Training_loss 1.37363,   Relative Error 0.44911


 47%|████▋     | 937/2000 [01:33<01:37, 10.95it/s]

Training_loss 1.37271,   Relative Error 0.44894
Training_loss 1.37524,   Relative Error 0.44935
Training_loss 1.37591,   Relative Error 0.44947


 47%|████▋     | 939/2000 [01:33<01:31, 11.66it/s]

Training_loss 1.37715,   Relative Error 0.44966
Training_loss 1.37560,   Relative Error 0.44938
Training_loss 1.37735,   Relative Error 0.44966


 47%|████▋     | 943/2000 [01:33<01:27, 12.04it/s]

Training_loss 1.37903,   Relative Error 0.44992
Training_loss 1.38178,   Relative Error 0.45036
Training_loss 1.37926,   Relative Error 0.44996


 47%|████▋     | 945/2000 [01:33<01:25, 12.32it/s]

Training_loss 1.37962,   Relative Error 0.45001
Training_loss 1.37974,   Relative Error 0.45005
Training_loss 1.38126,   Relative Error 0.45031


 47%|████▋     | 949/2000 [01:33<01:27, 12.02it/s]

Training_loss 1.37696,   Relative Error 0.44964
Training_loss 1.37598,   Relative Error 0.44949
Training_loss 1.37613,   Relative Error 0.44951


 48%|████▊     | 951/2000 [01:34<01:46,  9.88it/s]

Training_loss 1.37757,   Relative Error 0.44971
Training_loss 1.38014,   Relative Error 0.45014


 48%|████▊     | 954/2000 [01:34<01:59,  8.75it/s]

Training_loss 1.38121,   Relative Error 0.45031
Training_loss 1.38025,   Relative Error 0.45013
Training_loss 1.37838,   Relative Error 0.44980


 48%|████▊     | 955/2000 [01:34<02:02,  8.55it/s]

Training_loss 1.37702,   Relative Error 0.44959
Training_loss 1.37846,   Relative Error 0.44981


 48%|████▊     | 958/2000 [01:35<02:23,  7.25it/s]

Training_loss 1.37936,   Relative Error 0.44994
Training_loss 1.38020,   Relative Error 0.45007


 48%|████▊     | 960/2000 [01:35<02:05,  8.31it/s]

Training_loss 1.38160,   Relative Error 0.45029
Training_loss 1.38297,   Relative Error 0.45052
Training_loss 1.38398,   Relative Error 0.45068


 48%|████▊     | 962/2000 [01:35<01:53,  9.16it/s]

Training_loss 1.38221,   Relative Error 0.45035


 48%|████▊     | 965/2000 [01:36<02:06,  8.16it/s]

Training_loss 1.38428,   Relative Error 0.45069
Training_loss 1.38816,   Relative Error 0.45130
Training_loss 1.38969,   Relative Error 0.45153


 48%|████▊     | 966/2000 [01:36<02:05,  8.23it/s]

Training_loss 1.39169,   Relative Error 0.45186


 48%|████▊     | 968/2000 [01:36<02:25,  7.11it/s]

Training_loss 1.39430,   Relative Error 0.45228
Training_loss 1.39657,   Relative Error 0.45263


 48%|████▊     | 970/2000 [01:36<02:05,  8.22it/s]

Training_loss 1.39383,   Relative Error 0.45220
Training_loss 1.39632,   Relative Error 0.45262
Training_loss 1.39671,   Relative Error 0.45268


 49%|████▊     | 973/2000 [01:36<01:49,  9.40it/s]

Training_loss 1.39681,   Relative Error 0.45270
Training_loss 1.39841,   Relative Error 0.45294


 49%|████▉     | 975/2000 [01:37<02:05,  8.19it/s]

Training_loss 1.39887,   Relative Error 0.45302
Training_loss 1.39921,   Relative Error 0.45305


 49%|████▉     | 977/2000 [01:37<02:01,  8.45it/s]

Training_loss 1.39994,   Relative Error 0.45317
Training_loss 1.40371,   Relative Error 0.45379


 49%|████▉     | 978/2000 [01:37<02:03,  8.28it/s]

Training_loss 1.40177,   Relative Error 0.45348
Training_loss 1.40407,   Relative Error 0.45384


 49%|████▉     | 981/2000 [01:37<01:55,  8.80it/s]

Training_loss 1.40531,   Relative Error 0.45404
Training_loss 1.40577,   Relative Error 0.45409


 49%|████▉     | 983/2000 [01:38<01:45,  9.60it/s]

Training_loss 1.40574,   Relative Error 0.45407
Training_loss 1.40620,   Relative Error 0.45412


 49%|████▉     | 985/2000 [01:38<01:54,  8.88it/s]

Training_loss 1.40574,   Relative Error 0.45401
Training_loss 1.40410,   Relative Error 0.45374
Training_loss 1.40593,   Relative Error 0.45403


 49%|████▉     | 988/2000 [01:38<01:48,  9.36it/s]

Training_loss 1.40861,   Relative Error 0.45447
Training_loss 1.40935,   Relative Error 0.45457


 50%|████▉     | 990/2000 [01:38<01:47,  9.39it/s]

Training_loss 1.40885,   Relative Error 0.45450
Training_loss 1.41109,   Relative Error 0.45488
Training_loss 1.41302,   Relative Error 0.45519


 50%|████▉     | 994/2000 [01:39<01:34, 10.67it/s]

Training_loss 1.41252,   Relative Error 0.45509
Training_loss 1.41044,   Relative Error 0.45477
Training_loss 1.40966,   Relative Error 0.45462


 50%|████▉     | 996/2000 [01:39<01:35, 10.55it/s]

Training_loss 1.41177,   Relative Error 0.45498
Training_loss 1.41132,   Relative Error 0.45490
Training_loss 1.41376,   Relative Error 0.45529


 50%|████▉     | 998/2000 [01:39<01:33, 10.67it/s]

Training_loss 1.41512,   Relative Error 0.45547
Training_loss 1.41718,   Relative Error 0.45580


 50%|█████     | 1000/2000 [01:39<01:39, 10.05it/s]

Training_loss 1.41877,   Relative Error 0.45603
Training_loss 1.41921,   Relative Error 0.45609


 50%|█████     | 1004/2000 [01:40<01:34, 10.49it/s]

Training_loss 1.41823,   Relative Error 0.45594
Training_loss 1.41981,   Relative Error 0.45619
Training_loss 1.42049,   Relative Error 0.45628


 50%|█████     | 1006/2000 [01:40<01:39,  9.98it/s]

Training_loss 1.42190,   Relative Error 0.45651
Training_loss 1.42394,   Relative Error 0.45684


 50%|█████     | 1008/2000 [01:40<01:50,  8.97it/s]

Training_loss 1.42478,   Relative Error 0.45695
Training_loss 1.42742,   Relative Error 0.45737


 51%|█████     | 1011/2000 [01:41<01:44,  9.44it/s]

Training_loss 1.43020,   Relative Error 0.45782
Training_loss 1.42922,   Relative Error 0.45764
Training_loss 1.42930,   Relative Error 0.45764


 51%|█████     | 1013/2000 [01:41<01:40,  9.82it/s]

Training_loss 1.43182,   Relative Error 0.45804
Training_loss 1.43329,   Relative Error 0.45827


 51%|█████     | 1015/2000 [01:41<01:42,  9.60it/s]

Training_loss 1.43326,   Relative Error 0.45826
Training_loss 1.43501,   Relative Error 0.45854
Training_loss 1.43848,   Relative Error 0.45908


 51%|█████     | 1019/2000 [01:41<01:27, 11.19it/s]

Training_loss 1.44096,   Relative Error 0.45948
Training_loss 1.44265,   Relative Error 0.45974
Training_loss 1.44268,   Relative Error 0.45971


 51%|█████     | 1021/2000 [01:41<01:32, 10.55it/s]

Training_loss 1.44446,   Relative Error 0.45997
Training_loss 1.44429,   Relative Error 0.45992
Training_loss 1.44700,   Relative Error 0.46035


 51%|█████▏    | 1025/2000 [01:42<01:26, 11.25it/s]

Training_loss 1.44864,   Relative Error 0.46060
Training_loss 1.44933,   Relative Error 0.46069
Training_loss 1.45069,   Relative Error 0.46090


 51%|█████▏    | 1027/2000 [01:42<01:24, 11.55it/s]

Training_loss 1.45298,   Relative Error 0.46125
Training_loss 1.45460,   Relative Error 0.46149
Training_loss 1.45505,   Relative Error 0.46154


 52%|█████▏    | 1031/2000 [01:42<01:30, 10.70it/s]

Training_loss 1.45710,   Relative Error 0.46186
Training_loss 1.46098,   Relative Error 0.46246
Training_loss 1.46238,   Relative Error 0.46266


 52%|█████▏    | 1033/2000 [01:43<01:29, 10.76it/s]

Training_loss 1.46660,   Relative Error 0.46332
Training_loss 1.46837,   Relative Error 0.46360
Training_loss 1.46958,   Relative Error 0.46375


 52%|█████▏    | 1037/2000 [01:43<01:23, 11.60it/s]

Training_loss 1.47292,   Relative Error 0.46428
Training_loss 1.47297,   Relative Error 0.46426
Training_loss 1.47501,   Relative Error 0.46457


 52%|█████▏    | 1039/2000 [01:43<01:22, 11.70it/s]

Training_loss 1.47672,   Relative Error 0.46483
Training_loss 1.48026,   Relative Error 0.46537
Training_loss 1.48096,   Relative Error 0.46549


 52%|█████▏    | 1043/2000 [01:43<01:26, 11.11it/s]

Training_loss 1.48157,   Relative Error 0.46557
Training_loss 1.48316,   Relative Error 0.46582
Training_loss 1.48502,   Relative Error 0.46608


 52%|█████▏    | 1045/2000 [01:44<01:27, 10.97it/s]

Training_loss 1.48682,   Relative Error 0.46635
Training_loss 1.48973,   Relative Error 0.46678
Training_loss 1.49257,   Relative Error 0.46722


 52%|█████▏    | 1049/2000 [01:44<01:24, 11.20it/s]

Training_loss 1.49318,   Relative Error 0.46728
Training_loss 1.49409,   Relative Error 0.46741
Training_loss 1.49630,   Relative Error 0.46776


 53%|█████▎    | 1051/2000 [01:44<01:20, 11.72it/s]

Training_loss 1.49796,   Relative Error 0.46802
Training_loss 1.49892,   Relative Error 0.46817
Training_loss 1.50155,   Relative Error 0.46858


 53%|█████▎    | 1055/2000 [01:45<01:28, 10.64it/s]

Training_loss 1.50093,   Relative Error 0.46848
Training_loss 1.50460,   Relative Error 0.46905
Training_loss 1.50397,   Relative Error 0.46896


 53%|█████▎    | 1057/2000 [01:45<01:28, 10.62it/s]

Training_loss 1.50724,   Relative Error 0.46946
Training_loss 1.50404,   Relative Error 0.46891
Training_loss 1.50801,   Relative Error 0.46952


 53%|█████▎    | 1061/2000 [01:45<01:31, 10.30it/s]

Training_loss 1.50955,   Relative Error 0.46973
Training_loss 1.51091,   Relative Error 0.46992
Training_loss 1.51326,   Relative Error 0.47029


 53%|█████▎    | 1063/2000 [01:45<01:30, 10.37it/s]

Training_loss 1.51188,   Relative Error 0.47007
Training_loss 1.51140,   Relative Error 0.46999
Training_loss 1.51330,   Relative Error 0.47026


 53%|█████▎    | 1065/2000 [01:45<01:29, 10.49it/s]

Training_loss 1.51559,   Relative Error 0.47058
Training_loss 1.51861,   Relative Error 0.47104


 53%|█████▎    | 1069/2000 [01:46<01:28, 10.47it/s]

Training_loss 1.51837,   Relative Error 0.47104
Training_loss 1.51850,   Relative Error 0.47107
Training_loss 1.51903,   Relative Error 0.47115


 54%|█████▎    | 1071/2000 [01:46<01:23, 11.11it/s]

Training_loss 1.51893,   Relative Error 0.47113
Training_loss 1.52214,   Relative Error 0.47161
Training_loss 1.52264,   Relative Error 0.47167


 54%|█████▍    | 1075/2000 [01:46<01:22, 11.23it/s]

Training_loss 1.52376,   Relative Error 0.47183
Training_loss 1.52641,   Relative Error 0.47223
Training_loss 1.52559,   Relative Error 0.47210


 54%|█████▍    | 1077/2000 [01:47<01:28, 10.46it/s]

Training_loss 1.52435,   Relative Error 0.47193
Training_loss 1.52605,   Relative Error 0.47219
Training_loss 1.52765,   Relative Error 0.47243


 54%|█████▍    | 1081/2000 [01:47<01:25, 10.81it/s]

Training_loss 1.52945,   Relative Error 0.47270
Training_loss 1.53209,   Relative Error 0.47308
Training_loss 1.53496,   Relative Error 0.47354


 54%|█████▍    | 1083/2000 [01:47<01:24, 10.88it/s]

Training_loss 1.53605,   Relative Error 0.47368
Training_loss 1.53716,   Relative Error 0.47386
Training_loss 1.53930,   Relative Error 0.47419


 54%|█████▍    | 1087/2000 [01:47<01:18, 11.59it/s]

Training_loss 1.54040,   Relative Error 0.47436
Training_loss 1.53691,   Relative Error 0.47380
Training_loss 1.53870,   Relative Error 0.47409


 54%|█████▍    | 1089/2000 [01:48<01:19, 11.49it/s]

Training_loss 1.54103,   Relative Error 0.47445
Training_loss 1.54098,   Relative Error 0.47448
Training_loss 1.54474,   Relative Error 0.47504


 55%|█████▍    | 1093/2000 [01:48<01:16, 11.81it/s]

Training_loss 1.54490,   Relative Error 0.47503
Training_loss 1.54628,   Relative Error 0.47524
Training_loss 1.54850,   Relative Error 0.47557


 55%|█████▍    | 1095/2000 [01:48<01:17, 11.67it/s]

Training_loss 1.54735,   Relative Error 0.47542
Training_loss 1.55066,   Relative Error 0.47592
Training_loss 1.55061,   Relative Error 0.47593


 55%|█████▍    | 1099/2000 [01:49<01:23, 10.82it/s]

Training_loss 1.55090,   Relative Error 0.47598
Training_loss 1.55420,   Relative Error 0.47646
Training_loss 1.55454,   Relative Error 0.47649


 55%|█████▌    | 1101/2000 [01:49<01:27, 10.30it/s]

Training_loss 1.55500,   Relative Error 0.47654
Training_loss 1.55896,   Relative Error 0.47714
Training_loss 1.56098,   Relative Error 0.47744


 55%|█████▌    | 1105/2000 [01:49<01:22, 10.80it/s]

Training_loss 1.56298,   Relative Error 0.47773
Training_loss 1.56703,   Relative Error 0.47832
Training_loss 1.56635,   Relative Error 0.47820


 55%|█████▌    | 1107/2000 [01:49<01:21, 11.02it/s]

Training_loss 1.56825,   Relative Error 0.47844
Training_loss 1.57115,   Relative Error 0.47886
Training_loss 1.57278,   Relative Error 0.47909


 55%|█████▌    | 1109/2000 [01:49<01:19, 11.16it/s]

Training_loss 1.57493,   Relative Error 0.47940
Training_loss 1.57586,   Relative Error 0.47953


 56%|█████▌    | 1113/2000 [01:50<01:26, 10.24it/s]

Training_loss 1.57733,   Relative Error 0.47974
Training_loss 1.57778,   Relative Error 0.47980
Training_loss 1.57846,   Relative Error 0.47991


 56%|█████▌    | 1115/2000 [01:50<01:24, 10.46it/s]

Training_loss 1.57632,   Relative Error 0.47959
Training_loss 1.57705,   Relative Error 0.47966
Training_loss 1.57684,   Relative Error 0.47962


 56%|█████▌    | 1117/2000 [01:50<01:24, 10.48it/s]

Training_loss 1.57656,   Relative Error 0.47954
Training_loss 1.57893,   Relative Error 0.47991


 56%|█████▌    | 1121/2000 [01:51<01:26, 10.17it/s]

Training_loss 1.57429,   Relative Error 0.47922
Training_loss 1.57430,   Relative Error 0.47923
Training_loss 1.57902,   Relative Error 0.47993


 56%|█████▌    | 1123/2000 [01:51<01:26, 10.14it/s]

Training_loss 1.58151,   Relative Error 0.48027
Training_loss 1.58274,   Relative Error 0.48043
Training_loss 1.58535,   Relative Error 0.48085


 56%|█████▋    | 1127/2000 [01:51<01:22, 10.52it/s]

Training_loss 1.58580,   Relative Error 0.48089
Training_loss 1.58658,   Relative Error 0.48098
Training_loss 1.58982,   Relative Error 0.48147


 56%|█████▋    | 1129/2000 [01:51<01:18, 11.08it/s]

Training_loss 1.59056,   Relative Error 0.48155
Training_loss 1.59034,   Relative Error 0.48150
Training_loss 1.58988,   Relative Error 0.48140


 57%|█████▋    | 1133/2000 [01:52<01:14, 11.71it/s]

Training_loss 1.59138,   Relative Error 0.48165
Training_loss 1.59359,   Relative Error 0.48196
Training_loss 1.59681,   Relative Error 0.48244


 57%|█████▋    | 1135/2000 [01:52<01:14, 11.57it/s]

Training_loss 1.59756,   Relative Error 0.48256
Training_loss 1.59773,   Relative Error 0.48258


 57%|█████▋    | 1137/2000 [01:52<01:23, 10.33it/s]

Training_loss 1.59988,   Relative Error 0.48288
Training_loss 1.59919,   Relative Error 0.48276
Training_loss 1.60128,   Relative Error 0.48303


 57%|█████▋    | 1139/2000 [01:52<01:21, 10.59it/s]

Training_loss 1.60277,   Relative Error 0.48324
Training_loss 1.60425,   Relative Error 0.48346


 57%|█████▋    | 1143/2000 [01:53<01:27,  9.79it/s]

Training_loss 1.60553,   Relative Error 0.48365
Training_loss 1.60547,   Relative Error 0.48363
Training_loss 1.60347,   Relative Error 0.48330


 57%|█████▋    | 1146/2000 [01:53<01:25, 10.03it/s]

Training_loss 1.60370,   Relative Error 0.48330
Training_loss 1.60747,   Relative Error 0.48387
Training_loss 1.60835,   Relative Error 0.48402


 57%|█████▋    | 1148/2000 [01:53<01:30,  9.41it/s]

Training_loss 1.60984,   Relative Error 0.48420
Training_loss 1.61291,   Relative Error 0.48462
Training_loss 1.61636,   Relative Error 0.48511


 58%|█████▊    | 1152/2000 [01:54<01:20, 10.49it/s]

Training_loss 1.61890,   Relative Error 0.48549
Training_loss 1.62105,   Relative Error 0.48580
Training_loss 1.62364,   Relative Error 0.48616


 58%|█████▊    | 1154/2000 [01:54<01:18, 10.72it/s]

Training_loss 1.62337,   Relative Error 0.48610
Training_loss 1.62662,   Relative Error 0.48657
Training_loss 1.62844,   Relative Error 0.48683


 58%|█████▊    | 1158/2000 [01:54<01:18, 10.79it/s]

Training_loss 1.63227,   Relative Error 0.48737
Training_loss 1.63601,   Relative Error 0.48791
Training_loss 1.63502,   Relative Error 0.48775


 58%|█████▊    | 1160/2000 [01:54<01:17, 10.88it/s]

Training_loss 1.63722,   Relative Error 0.48807
Training_loss 1.63865,   Relative Error 0.48829
Training_loss 1.63508,   Relative Error 0.48772


 58%|█████▊    | 1164/2000 [01:55<01:17, 10.75it/s]

Training_loss 1.63644,   Relative Error 0.48790
Training_loss 1.63956,   Relative Error 0.48835
Training_loss 1.64149,   Relative Error 0.48862


 58%|█████▊    | 1166/2000 [01:55<01:17, 10.72it/s]

Training_loss 1.64415,   Relative Error 0.48901
Training_loss 1.64241,   Relative Error 0.48875


 58%|█████▊    | 1168/2000 [01:55<01:21, 10.15it/s]

Training_loss 1.64472,   Relative Error 0.48910
Training_loss 1.64698,   Relative Error 0.48941
Training_loss 1.64644,   Relative Error 0.48931


 59%|█████▊    | 1172/2000 [01:55<01:16, 10.81it/s]

Training_loss 1.64820,   Relative Error 0.48957
Training_loss 1.64922,   Relative Error 0.48970
Training_loss 1.65054,   Relative Error 0.48991


 59%|█████▊    | 1174/2000 [01:56<01:16, 10.74it/s]

Training_loss 1.65216,   Relative Error 0.49014
Training_loss 1.65436,   Relative Error 0.49045
Training_loss 1.65678,   Relative Error 0.49079


 59%|█████▉    | 1178/2000 [01:56<01:14, 11.11it/s]

Training_loss 1.65229,   Relative Error 0.49012
Training_loss 1.65600,   Relative Error 0.49068
Training_loss 1.66058,   Relative Error 0.49133


 59%|█████▉    | 1180/2000 [01:56<01:14, 11.06it/s]

Training_loss 1.66364,   Relative Error 0.49176
Training_loss 1.66542,   Relative Error 0.49202
Training_loss 1.66528,   Relative Error 0.49198


 59%|█████▉    | 1184/2000 [01:57<01:16, 10.61it/s]

Training_loss 1.66455,   Relative Error 0.49187
Training_loss 1.66734,   Relative Error 0.49224
Training_loss 1.67184,   Relative Error 0.49288


 59%|█████▉    | 1186/2000 [01:57<01:20, 10.12it/s]

Training_loss 1.66565,   Relative Error 0.49198
Training_loss 1.66765,   Relative Error 0.49224
Training_loss 1.67054,   Relative Error 0.49267


 59%|█████▉    | 1188/2000 [01:57<01:18, 10.32it/s]

Training_loss 1.67416,   Relative Error 0.49317
Training_loss 1.67659,   Relative Error 0.49349


 60%|█████▉    | 1192/2000 [01:57<01:17, 10.36it/s]

Training_loss 1.67963,   Relative Error 0.49392
Training_loss 1.68184,   Relative Error 0.49423
Training_loss 1.68357,   Relative Error 0.49446


 60%|█████▉    | 1194/2000 [01:58<01:16, 10.53it/s]

Training_loss 1.67908,   Relative Error 0.49379
Training_loss 1.68123,   Relative Error 0.49411
Training_loss 1.68064,   Relative Error 0.49400


 60%|█████▉    | 1196/2000 [01:58<01:15, 10.61it/s]

Training_loss 1.68480,   Relative Error 0.49459
Training_loss 1.68787,   Relative Error 0.49500


 60%|██████    | 1200/2000 [01:58<01:19, 10.06it/s]

Training_loss 1.69147,   Relative Error 0.49551
Training_loss 1.69438,   Relative Error 0.49596
Training_loss 1.69900,   Relative Error 0.49660


 60%|██████    | 1202/2000 [01:58<01:17, 10.35it/s]

Training_loss 1.70030,   Relative Error 0.49679
Training_loss 1.70145,   Relative Error 0.49696
Training_loss 1.69869,   Relative Error 0.49654


 60%|██████    | 1206/2000 [01:59<01:10, 11.34it/s]

Training_loss 1.70164,   Relative Error 0.49694
Training_loss 1.70532,   Relative Error 0.49748
Training_loss 1.70479,   Relative Error 0.49740


 60%|██████    | 1208/2000 [01:59<01:07, 11.70it/s]

Training_loss 1.70954,   Relative Error 0.49805
Training_loss 1.71301,   Relative Error 0.49853
Training_loss 1.71399,   Relative Error 0.49869


 61%|██████    | 1212/2000 [01:59<01:02, 12.57it/s]

Training_loss 1.71828,   Relative Error 0.49929
Training_loss 1.71808,   Relative Error 0.49925
Training_loss 1.71963,   Relative Error 0.49948


 61%|██████    | 1214/2000 [01:59<01:06, 11.85it/s]

Training_loss 1.72343,   Relative Error 0.50002
Training_loss 1.72542,   Relative Error 0.50029
Training_loss 1.72463,   Relative Error 0.50017


 61%|██████    | 1216/2000 [02:00<01:08, 11.48it/s]

Training_loss 1.72567,   Relative Error 0.50030
Training_loss 1.72709,   Relative Error 0.50049


 61%|██████    | 1220/2000 [02:00<01:11, 10.88it/s]

Training_loss 1.73042,   Relative Error 0.50096
Training_loss 1.73215,   Relative Error 0.50121
Training_loss 1.73062,   Relative Error 0.50098


 61%|██████    | 1222/2000 [02:00<01:09, 11.11it/s]

Training_loss 1.73209,   Relative Error 0.50120
Training_loss 1.73606,   Relative Error 0.50175
Training_loss 1.73821,   Relative Error 0.50203


 61%|██████▏   | 1226/2000 [02:00<01:09, 11.19it/s]

Training_loss 1.73942,   Relative Error 0.50213
Training_loss 1.74235,   Relative Error 0.50257
Training_loss 1.74074,   Relative Error 0.50229


 61%|██████▏   | 1228/2000 [02:01<01:11, 10.73it/s]

Training_loss 1.74091,   Relative Error 0.50230
Training_loss 1.74505,   Relative Error 0.50287
Training_loss 1.74497,   Relative Error 0.50283


 62%|██████▏   | 1232/2000 [02:01<01:13, 10.44it/s]

Training_loss 1.74901,   Relative Error 0.50339
Training_loss 1.75238,   Relative Error 0.50386
Training_loss 1.75105,   Relative Error 0.50369


 62%|██████▏   | 1234/2000 [02:01<01:13, 10.47it/s]

Training_loss 1.74585,   Relative Error 0.50293
Training_loss 1.74910,   Relative Error 0.50338


 62%|██████▏   | 1236/2000 [02:01<01:16, 10.01it/s]

Training_loss 1.75390,   Relative Error 0.50407
Training_loss 1.75438,   Relative Error 0.50411
Training_loss 1.75418,   Relative Error 0.50406


 62%|██████▏   | 1240/2000 [02:02<01:08, 11.15it/s]

Training_loss 1.75648,   Relative Error 0.50438
Training_loss 1.75703,   Relative Error 0.50443
Training_loss 1.75905,   Relative Error 0.50469


 62%|██████▏   | 1242/2000 [02:02<01:05, 11.58it/s]

Training_loss 1.76153,   Relative Error 0.50501
Training_loss 1.76593,   Relative Error 0.50563
Training_loss 1.76727,   Relative Error 0.50580


 62%|██████▏   | 1246/2000 [02:02<01:03, 11.92it/s]

Training_loss 1.77106,   Relative Error 0.50630
Training_loss 1.77292,   Relative Error 0.50658
Training_loss 1.77635,   Relative Error 0.50706


 62%|██████▏   | 1248/2000 [02:02<01:03, 11.90it/s]

Training_loss 1.78049,   Relative Error 0.50764
Training_loss 1.78255,   Relative Error 0.50791
Training_loss 1.78307,   Relative Error 0.50798


 63%|██████▎   | 1252/2000 [02:03<01:05, 11.46it/s]

Training_loss 1.78543,   Relative Error 0.50830
Training_loss 1.78911,   Relative Error 0.50878
Training_loss 1.79005,   Relative Error 0.50891


 63%|██████▎   | 1254/2000 [02:03<01:02, 12.01it/s]

Training_loss 1.78965,   Relative Error 0.50883
Training_loss 1.78967,   Relative Error 0.50883
Training_loss 1.78924,   Relative Error 0.50878


 63%|██████▎   | 1258/2000 [02:03<00:59, 12.55it/s]

Training_loss 1.79416,   Relative Error 0.50945
Training_loss 1.79877,   Relative Error 0.51009
Training_loss 1.80015,   Relative Error 0.51027


 63%|██████▎   | 1260/2000 [02:03<01:00, 12.25it/s]

Training_loss 1.80335,   Relative Error 0.51071
Training_loss 1.80594,   Relative Error 0.51106


 63%|██████▎   | 1262/2000 [02:04<01:04, 11.45it/s]

Training_loss 1.80981,   Relative Error 0.51160
Training_loss 1.81249,   Relative Error 0.51197
Training_loss 1.81516,   Relative Error 0.51232


 63%|██████▎   | 1266/2000 [02:04<01:03, 11.61it/s]

Training_loss 1.81952,   Relative Error 0.51290
Training_loss 1.82390,   Relative Error 0.51351
Training_loss 1.82439,   Relative Error 0.51354


 63%|██████▎   | 1268/2000 [02:04<01:05, 11.21it/s]

Training_loss 1.82981,   Relative Error 0.51427
Training_loss 1.83241,   Relative Error 0.51462
Training_loss 1.83585,   Relative Error 0.51510


 64%|██████▎   | 1272/2000 [02:04<01:04, 11.37it/s]

Training_loss 1.83781,   Relative Error 0.51537
Training_loss 1.83742,   Relative Error 0.51533
Training_loss 1.83708,   Relative Error 0.51529


 64%|██████▎   | 1274/2000 [02:05<01:02, 11.56it/s]

Training_loss 1.84127,   Relative Error 0.51586
Training_loss 1.84224,   Relative Error 0.51597
Training_loss 1.84609,   Relative Error 0.51650


 64%|██████▍   | 1276/2000 [02:05<01:07, 10.69it/s]

Training_loss 1.84777,   Relative Error 0.51673
Training_loss 1.84904,   Relative Error 0.51688


 64%|██████▍   | 1278/2000 [02:05<01:12, 10.01it/s]

Training_loss 1.84843,   Relative Error 0.51683
Training_loss 1.85126,   Relative Error 0.51723


 64%|██████▍   | 1282/2000 [02:06<01:15,  9.46it/s]

Training_loss 1.85442,   Relative Error 0.51764
Training_loss 1.85291,   Relative Error 0.51748
Training_loss 1.85476,   Relative Error 0.51772


 64%|██████▍   | 1285/2000 [02:06<01:12,  9.88it/s]

Training_loss 1.85718,   Relative Error 0.51804
Training_loss 1.85676,   Relative Error 0.51801
Training_loss 1.86154,   Relative Error 0.51867


 64%|██████▍   | 1287/2000 [02:06<01:06, 10.68it/s]

Training_loss 1.86608,   Relative Error 0.51929
Training_loss 1.86460,   Relative Error 0.51909
Training_loss 1.86856,   Relative Error 0.51960


 65%|██████▍   | 1291/2000 [02:06<00:59, 11.83it/s]

Training_loss 1.86786,   Relative Error 0.51951
Training_loss 1.87066,   Relative Error 0.51992
Training_loss 1.87094,   Relative Error 0.51995


 65%|██████▍   | 1293/2000 [02:06<00:57, 12.20it/s]

Training_loss 1.87413,   Relative Error 0.52039
Training_loss 1.87574,   Relative Error 0.52060
Training_loss 1.87970,   Relative Error 0.52113


 65%|██████▍   | 1297/2000 [02:07<01:00, 11.60it/s]

Training_loss 1.88289,   Relative Error 0.52155
Training_loss 1.88777,   Relative Error 0.52220
Training_loss 1.89047,   Relative Error 0.52255


 65%|██████▍   | 1299/2000 [02:07<01:03, 11.12it/s]

Training_loss 1.89443,   Relative Error 0.52308
Training_loss 1.89523,   Relative Error 0.52315
Training_loss 1.89914,   Relative Error 0.52366


 65%|██████▌   | 1303/2000 [02:07<01:05, 10.68it/s]

Training_loss 1.90339,   Relative Error 0.52423
Training_loss 1.90469,   Relative Error 0.52435
Training_loss 1.90189,   Relative Error 0.52393


 65%|██████▌   | 1305/2000 [02:08<01:04, 10.80it/s]

Training_loss 1.90300,   Relative Error 0.52409
Training_loss 1.90323,   Relative Error 0.52408
Training_loss 1.90298,   Relative Error 0.52405

 65%|██████▌   | 1307/2000 [02:08<01:03, 10.99it/s]


Training_loss 1.90490,   Relative Error 0.52431
Training_loss 1.90499,   Relative Error 0.52432


 66%|██████▌   | 1311/2000 [02:08<00:59, 11.58it/s]

Training_loss 1.90712,   Relative Error 0.52459
Training_loss 1.91221,   Relative Error 0.52524
Training_loss 1.91029,   Relative Error 0.52494


 66%|██████▌   | 1313/2000 [02:08<00:57, 11.93it/s]

Training_loss 1.91639,   Relative Error 0.52577
Training_loss 1.92027,   Relative Error 0.52628
Training_loss 1.92379,   Relative Error 0.52672


 66%|██████▌   | 1317/2000 [02:09<00:55, 12.26it/s]

Training_loss 1.92431,   Relative Error 0.52676
Training_loss 1.92372,   Relative Error 0.52664
Training_loss 1.92759,   Relative Error 0.52716


 66%|██████▌   | 1319/2000 [02:09<00:54, 12.61it/s]

Training_loss 1.93085,   Relative Error 0.52760
Training_loss 1.93420,   Relative Error 0.52807
Training_loss 1.93668,   Relative Error 0.52839


 66%|██████▌   | 1323/2000 [02:09<00:56, 11.97it/s]

Training_loss 1.93653,   Relative Error 0.52837
Training_loss 1.94089,   Relative Error 0.52891
Training_loss 1.94126,   Relative Error 0.52898


 66%|██████▋   | 1325/2000 [02:09<00:55, 12.24it/s]

Training_loss 1.94160,   Relative Error 0.52905
Training_loss 1.94636,   Relative Error 0.52965
Training_loss 1.95042,   Relative Error 0.53020


 66%|██████▋   | 1329/2000 [02:10<00:53, 12.52it/s]

Training_loss 1.95458,   Relative Error 0.53072
Training_loss 1.96006,   Relative Error 0.53142
Training_loss 1.96321,   Relative Error 0.53186


 67%|██████▋   | 1331/2000 [02:10<00:54, 12.31it/s]

Training_loss 1.96263,   Relative Error 0.53174
Training_loss 1.96251,   Relative Error 0.53170
Training_loss 1.96451,   Relative Error 0.53191


 67%|██████▋   | 1335/2000 [02:10<00:54, 12.23it/s]

Training_loss 1.96533,   Relative Error 0.53202
Training_loss 1.96858,   Relative Error 0.53246
Training_loss 1.97115,   Relative Error 0.53276


 67%|██████▋   | 1337/2000 [02:10<00:54, 12.19it/s]

Training_loss 1.97239,   Relative Error 0.53295
Training_loss 1.97704,   Relative Error 0.53354
Training_loss 1.97733,   Relative Error 0.53358


 67%|██████▋   | 1341/2000 [02:11<00:53, 12.39it/s]

Training_loss 1.97934,   Relative Error 0.53387
Training_loss 1.98346,   Relative Error 0.53441
Training_loss 1.98148,   Relative Error 0.53412


 67%|██████▋   | 1343/2000 [02:11<00:52, 12.43it/s]

Training_loss 1.98716,   Relative Error 0.53486
Training_loss 1.99193,   Relative Error 0.53548
Training_loss 1.99190,   Relative Error 0.53547


 67%|██████▋   | 1347/2000 [02:11<00:51, 12.58it/s]

Training_loss 1.99422,   Relative Error 0.53577
Training_loss 1.99406,   Relative Error 0.53576
Training_loss 1.99558,   Relative Error 0.53596


 67%|██████▋   | 1349/2000 [02:11<00:52, 12.33it/s]

Training_loss 1.99780,   Relative Error 0.53625
Training_loss 2.00163,   Relative Error 0.53672
Training_loss 2.00276,   Relative Error 0.53683


 68%|██████▊   | 1353/2000 [02:12<00:54, 11.79it/s]

Training_loss 1.99990,   Relative Error 0.53648
Training_loss 2.00420,   Relative Error 0.53705
Training_loss 2.00743,   Relative Error 0.53751


 68%|██████▊   | 1355/2000 [02:12<00:55, 11.58it/s]

Training_loss 2.00729,   Relative Error 0.53744
Training_loss 2.00951,   Relative Error 0.53770
Training_loss 2.01299,   Relative Error 0.53815


 68%|██████▊   | 1359/2000 [02:12<00:59, 10.82it/s]

Training_loss 2.01060,   Relative Error 0.53785
Training_loss 2.01141,   Relative Error 0.53791
Training_loss 2.01695,   Relative Error 0.53863


 68%|██████▊   | 1361/2000 [02:12<01:04,  9.86it/s]

Training_loss 2.01982,   Relative Error 0.53898
Training_loss 2.02266,   Relative Error 0.53935


 68%|██████▊   | 1363/2000 [02:13<01:11,  8.96it/s]

Training_loss 2.02443,   Relative Error 0.53958
Training_loss 2.02461,   Relative Error 0.53957


 68%|██████▊   | 1365/2000 [02:13<01:13,  8.58it/s]

Training_loss 2.02341,   Relative Error 0.53939
Training_loss 2.02728,   Relative Error 0.53991


 68%|██████▊   | 1367/2000 [02:13<01:17,  8.12it/s]

Training_loss 2.03134,   Relative Error 0.54042
Training_loss 2.03634,   Relative Error 0.54107


 68%|██████▊   | 1369/2000 [02:13<01:26,  7.26it/s]

Training_loss 2.03805,   Relative Error 0.54132
Training_loss 2.03992,   Relative Error 0.54152


 69%|██████▊   | 1371/2000 [02:14<01:22,  7.66it/s]

Training_loss 2.04322,   Relative Error 0.54193
Training_loss 2.04847,   Relative Error 0.54258


 69%|██████▊   | 1373/2000 [02:14<01:37,  6.40it/s]

Training_loss 2.04953,   Relative Error 0.54271
Training_loss 2.05176,   Relative Error 0.54301
Training_loss 2.05208,   Relative Error 0.54304


 69%|██████▉   | 1376/2000 [02:14<01:21,  7.70it/s]

Training_loss 2.05317,   Relative Error 0.54319
Training_loss 2.04935,   Relative Error 0.54273


 69%|██████▉   | 1377/2000 [02:15<01:34,  6.62it/s]

Training_loss 2.05459,   Relative Error 0.54338


 69%|██████▉   | 1379/2000 [02:15<01:36,  6.40it/s]

Training_loss 2.05489,   Relative Error 0.54342
Training_loss 2.05864,   Relative Error 0.54389


 69%|██████▉   | 1381/2000 [02:15<01:49,  5.63it/s]

Training_loss 2.06265,   Relative Error 0.54441
Training_loss 2.05708,   Relative Error 0.54365


 69%|██████▉   | 1383/2000 [02:16<01:31,  6.76it/s]

Training_loss 2.05948,   Relative Error 0.54397
Training_loss 2.05902,   Relative Error 0.54383


 69%|██████▉   | 1385/2000 [02:16<01:18,  7.85it/s]

Training_loss 2.06396,   Relative Error 0.54449
Training_loss 2.06867,   Relative Error 0.54508
Training_loss 2.06540,   Relative Error 0.54459


 69%|██████▉   | 1387/2000 [02:16<01:08,  8.89it/s]

Training_loss 2.06461,   Relative Error 0.54453
Training_loss 2.06795,   Relative Error 0.54495


 70%|██████▉   | 1391/2000 [02:16<01:01,  9.84it/s]

Training_loss 2.07224,   Relative Error 0.54550
Training_loss 2.06956,   Relative Error 0.54518
Training_loss 2.07259,   Relative Error 0.54556


 70%|██████▉   | 1393/2000 [02:17<00:58, 10.35it/s]

Training_loss 2.07445,   Relative Error 0.54574
Training_loss 2.07455,   Relative Error 0.54576
Training_loss 2.07968,   Relative Error 0.54637


 70%|██████▉   | 1397/2000 [02:17<00:54, 10.99it/s]

Training_loss 2.08139,   Relative Error 0.54659
Training_loss 2.08574,   Relative Error 0.54715
Training_loss 2.08764,   Relative Error 0.54737


 70%|██████▉   | 1399/2000 [02:17<00:52, 11.48it/s]

Training_loss 2.08455,   Relative Error 0.54694
Training_loss 2.08458,   Relative Error 0.54689
Training_loss 2.08685,   Relative Error 0.54717


 70%|███████   | 1403/2000 [02:17<00:51, 11.56it/s]

Training_loss 2.09087,   Relative Error 0.54766
Training_loss 2.08939,   Relative Error 0.54742
Training_loss 2.09111,   Relative Error 0.54762


 70%|███████   | 1405/2000 [02:18<00:49, 11.94it/s]

Training_loss 2.09454,   Relative Error 0.54802
Training_loss 2.09457,   Relative Error 0.54804
Training_loss 2.09154,   Relative Error 0.54761


 70%|███████   | 1409/2000 [02:18<00:49, 12.00it/s]

Training_loss 2.09293,   Relative Error 0.54784
Training_loss 2.09170,   Relative Error 0.54767
Training_loss 2.09615,   Relative Error 0.54823


 71%|███████   | 1411/2000 [02:18<00:48, 12.26it/s]

Training_loss 2.09725,   Relative Error 0.54835
Training_loss 2.09712,   Relative Error 0.54829
Training_loss 2.09886,   Relative Error 0.54851


 71%|███████   | 1415/2000 [02:18<00:51, 11.46it/s]

Training_loss 2.10112,   Relative Error 0.54877
Training_loss 2.10414,   Relative Error 0.54919
Training_loss 2.10501,   Relative Error 0.54929


 71%|███████   | 1417/2000 [02:19<00:49, 11.73it/s]

Training_loss 2.10715,   Relative Error 0.54952
Training_loss 2.10237,   Relative Error 0.54887
Training_loss 2.10192,   Relative Error 0.54882


 71%|███████   | 1421/2000 [02:19<00:49, 11.61it/s]

Training_loss 2.10373,   Relative Error 0.54900
Training_loss 2.10739,   Relative Error 0.54946
Training_loss 2.10910,   Relative Error 0.54964


 71%|███████   | 1423/2000 [02:19<00:49, 11.76it/s]

Training_loss 2.11172,   Relative Error 0.54998
Training_loss 2.11574,   Relative Error 0.55047
Training_loss 2.12088,   Relative Error 0.55113


 71%|███████▏  | 1427/2000 [02:19<00:46, 12.25it/s]

Training_loss 2.12232,   Relative Error 0.55130
Training_loss 2.12251,   Relative Error 0.55137
Training_loss 2.12577,   Relative Error 0.55179


 71%|███████▏  | 1429/2000 [02:20<00:47, 12.09it/s]

Training_loss 2.12585,   Relative Error 0.55178
Training_loss 2.12855,   Relative Error 0.55212
Training_loss 2.12976,   Relative Error 0.55227


 72%|███████▏  | 1433/2000 [02:20<00:50, 11.33it/s]

Training_loss 2.12920,   Relative Error 0.55220
Training_loss 2.13198,   Relative Error 0.55253
Training_loss 2.13612,   Relative Error 0.55304


 72%|███████▏  | 1435/2000 [02:20<00:48, 11.77it/s]

Training_loss 2.14188,   Relative Error 0.55376
Training_loss 2.14257,   Relative Error 0.55385
Training_loss 2.14553,   Relative Error 0.55420


 72%|███████▏  | 1437/2000 [02:20<00:47, 11.91it/s]

Training_loss 2.14768,   Relative Error 0.55440
Training_loss 2.14945,   Relative Error 0.55464


 72%|███████▏  | 1441/2000 [02:21<00:52, 10.56it/s]

Training_loss 2.15285,   Relative Error 0.55508
Training_loss 2.15828,   Relative Error 0.55575
Training_loss 2.16157,   Relative Error 0.55616


 72%|███████▏  | 1443/2000 [02:21<00:52, 10.60it/s]

Training_loss 2.16338,   Relative Error 0.55638
Training_loss 2.16150,   Relative Error 0.55618
Training_loss 2.16378,   Relative Error 0.55647


 72%|███████▏  | 1447/2000 [02:21<00:49, 11.28it/s]

Training_loss 2.16486,   Relative Error 0.55659
Training_loss 2.16077,   Relative Error 0.55607
Training_loss 2.16692,   Relative Error 0.55685


 72%|███████▏  | 1449/2000 [02:21<00:53, 10.23it/s]

Training_loss 2.17181,   Relative Error 0.55747
Training_loss 2.16721,   Relative Error 0.55682
Training_loss 2.17112,   Relative Error 0.55728


 73%|███████▎  | 1453/2000 [02:22<00:49, 11.16it/s]

Training_loss 2.17208,   Relative Error 0.55738
Training_loss 2.17689,   Relative Error 0.55800
Training_loss 2.17931,   Relative Error 0.55832


 73%|███████▎  | 1455/2000 [02:22<00:46, 11.61it/s]

Training_loss 2.18038,   Relative Error 0.55840
Training_loss 2.17825,   Relative Error 0.55809
Training_loss 2.17822,   Relative Error 0.55808


 73%|███████▎  | 1459/2000 [02:22<00:45, 11.97it/s]

Training_loss 2.18143,   Relative Error 0.55849
Training_loss 2.18589,   Relative Error 0.55903
Training_loss 2.18813,   Relative Error 0.55928


 73%|███████▎  | 1461/2000 [02:22<00:44, 12.12it/s]

Training_loss 2.18890,   Relative Error 0.55935
Training_loss 2.18959,   Relative Error 0.55940
Training_loss 2.18913,   Relative Error 0.55931


 73%|███████▎  | 1465/2000 [02:23<00:45, 11.87it/s]

Training_loss 2.18621,   Relative Error 0.55883
Training_loss 2.18768,   Relative Error 0.55900
Training_loss 2.19132,   Relative Error 0.55944


 73%|███████▎  | 1467/2000 [02:23<00:43, 12.20it/s]

Training_loss 2.19219,   Relative Error 0.55960
Training_loss 2.19633,   Relative Error 0.56011
Training_loss 2.19865,   Relative Error 0.56038


 74%|███████▎  | 1471/2000 [02:23<00:43, 12.17it/s]

Training_loss 2.20229,   Relative Error 0.56079
Training_loss 2.20611,   Relative Error 0.56126
Training_loss 2.20389,   Relative Error 0.56098


 74%|███████▎  | 1473/2000 [02:23<00:43, 12.11it/s]

Training_loss 2.20327,   Relative Error 0.56095
Training_loss 2.20081,   Relative Error 0.56059
Training_loss 2.20559,   Relative Error 0.56119


 74%|███████▍  | 1477/2000 [02:24<00:41, 12.61it/s]

Training_loss 2.20791,   Relative Error 0.56143
Training_loss 2.20935,   Relative Error 0.56162
Training_loss 2.21333,   Relative Error 0.56211


 74%|███████▍  | 1479/2000 [02:24<00:42, 12.26it/s]

Training_loss 2.21520,   Relative Error 0.56236
Training_loss 2.21589,   Relative Error 0.56247
Training_loss 2.21718,   Relative Error 0.56262


 74%|███████▍  | 1483/2000 [02:24<00:47, 10.85it/s]

Training_loss 2.21809,   Relative Error 0.56270
Training_loss 2.21637,   Relative Error 0.56249
Training_loss 2.21841,   Relative Error 0.56277


 74%|███████▍  | 1485/2000 [02:25<00:48, 10.70it/s]

Training_loss 2.21940,   Relative Error 0.56281
Training_loss 2.21927,   Relative Error 0.56276
Training_loss 2.22169,   Relative Error 0.56302


 74%|███████▍  | 1489/2000 [02:25<00:47, 10.73it/s]

Training_loss 2.22396,   Relative Error 0.56330
Training_loss 2.22865,   Relative Error 0.56387
Training_loss 2.23013,   Relative Error 0.56408


 75%|███████▍  | 1491/2000 [02:25<00:47, 10.80it/s]

Training_loss 2.22927,   Relative Error 0.56401
Training_loss 2.23298,   Relative Error 0.56446


 75%|███████▍  | 1493/2000 [02:25<00:48, 10.36it/s]

Training_loss 2.23744,   Relative Error 0.56502
Training_loss 2.23558,   Relative Error 0.56476
Training_loss 2.24048,   Relative Error 0.56533


 75%|███████▍  | 1495/2000 [02:26<00:51,  9.72it/s]

Training_loss 2.24090,   Relative Error 0.56539
Training_loss 2.24374,   Relative Error 0.56573


 75%|███████▍  | 1498/2000 [02:26<00:57,  8.72it/s]

Training_loss 2.24282,   Relative Error 0.56556
Training_loss 2.24758,   Relative Error 0.56617
Training_loss 2.25117,   Relative Error 0.56662


 75%|███████▌  | 1502/2000 [02:26<00:49, 10.16it/s]

Training_loss 2.25304,   Relative Error 0.56684
Training_loss 2.25532,   Relative Error 0.56715
Training_loss 2.25323,   Relative Error 0.56691


 75%|███████▌  | 1504/2000 [02:26<00:45, 10.87it/s]

Training_loss 2.25852,   Relative Error 0.56759
Training_loss 2.25870,   Relative Error 0.56758
Training_loss 2.26159,   Relative Error 0.56789


 75%|███████▌  | 1508/2000 [02:27<00:41, 11.89it/s]

Training_loss 2.26091,   Relative Error 0.56778
Training_loss 2.25835,   Relative Error 0.56743
Training_loss 2.26118,   Relative Error 0.56774


 76%|███████▌  | 1510/2000 [02:27<00:40, 12.11it/s]

Training_loss 2.25695,   Relative Error 0.56723
Training_loss 2.25777,   Relative Error 0.56732
Training_loss 2.26037,   Relative Error 0.56762


 76%|███████▌  | 1514/2000 [02:27<00:39, 12.32it/s]

Training_loss 2.26181,   Relative Error 0.56782
Training_loss 2.26028,   Relative Error 0.56762
Training_loss 2.26640,   Relative Error 0.56835


 76%|███████▌  | 1516/2000 [02:27<00:39, 12.24it/s]

Training_loss 2.27277,   Relative Error 0.56913
Training_loss 2.27220,   Relative Error 0.56908
Training_loss 2.27727,   Relative Error 0.56969


 76%|███████▌  | 1520/2000 [02:28<00:41, 11.51it/s]

Training_loss 2.27842,   Relative Error 0.56980
Training_loss 2.28211,   Relative Error 0.57026
Training_loss 2.27776,   Relative Error 0.56971


 76%|███████▌  | 1522/2000 [02:28<00:42, 11.31it/s]

Training_loss 2.27467,   Relative Error 0.56929
Training_loss 2.28028,   Relative Error 0.56998
Training_loss 2.28170,   Relative Error 0.57011


 76%|███████▋  | 1526/2000 [02:28<00:41, 11.47it/s]

Training_loss 2.27976,   Relative Error 0.56981
Training_loss 2.28143,   Relative Error 0.57002
Training_loss 2.28598,   Relative Error 0.57059


 76%|███████▋  | 1528/2000 [02:28<00:40, 11.68it/s]

Training_loss 2.29183,   Relative Error 0.57132
Training_loss 2.29017,   Relative Error 0.57111
Training_loss 2.29309,   Relative Error 0.57146


 77%|███████▋  | 1532/2000 [02:29<00:37, 12.38it/s]

Training_loss 2.29580,   Relative Error 0.57176
Training_loss 2.29453,   Relative Error 0.57165
Training_loss 2.30155,   Relative Error 0.57250


 77%|███████▋  | 1534/2000 [02:29<00:38, 12.11it/s]

Training_loss 2.30456,   Relative Error 0.57282
Training_loss 2.30969,   Relative Error 0.57345
Training_loss 2.31496,   Relative Error 0.57409


 77%|███████▋  | 1538/2000 [02:29<00:37, 12.40it/s]

Training_loss 2.32048,   Relative Error 0.57477
Training_loss 2.32774,   Relative Error 0.57566
Training_loss 2.33146,   Relative Error 0.57612


 77%|███████▋  | 1540/2000 [02:29<00:36, 12.49it/s]

Training_loss 2.33444,   Relative Error 0.57650
Training_loss 2.34126,   Relative Error 0.57733
Training_loss 2.34666,   Relative Error 0.57798


 77%|███████▋  | 1542/2000 [02:30<00:37, 12.29it/s]

Training_loss 2.34815,   Relative Error 0.57815
Training_loss 2.35232,   Relative Error 0.57865


 77%|███████▋  | 1544/2000 [02:30<00:41, 11.04it/s]

Training_loss 2.35483,   Relative Error 0.57889
Training_loss 2.35914,   Relative Error 0.57937


 77%|███████▋  | 1546/2000 [02:30<01:09,  6.56it/s]

Training_loss 2.36479,   Relative Error 0.58004


 77%|███████▋  | 1549/2000 [02:31<01:02,  7.21it/s]

Training_loss 2.36853,   Relative Error 0.58043
Training_loss 2.37376,   Relative Error 0.58103
Training_loss 2.37152,   Relative Error 0.58073


 78%|███████▊  | 1551/2000 [02:31<00:53,  8.39it/s]

Training_loss 2.37187,   Relative Error 0.58072
Training_loss 2.37635,   Relative Error 0.58125
Training_loss 2.37516,   Relative Error 0.58109


 78%|███████▊  | 1555/2000 [02:31<00:42, 10.38it/s]

Training_loss 2.37551,   Relative Error 0.58110
Training_loss 2.38183,   Relative Error 0.58184
Training_loss 2.38065,   Relative Error 0.58173


 78%|███████▊  | 1557/2000 [02:31<00:39, 11.16it/s]

Training_loss 2.38346,   Relative Error 0.58207
Training_loss 2.38416,   Relative Error 0.58220
Training_loss 2.39247,   Relative Error 0.58320


 78%|███████▊  | 1561/2000 [02:32<00:39, 11.20it/s]

Training_loss 2.39485,   Relative Error 0.58351
Training_loss 2.39812,   Relative Error 0.58392
Training_loss 2.40072,   Relative Error 0.58419


 78%|███████▊  | 1563/2000 [02:32<00:38, 11.46it/s]

Training_loss 2.40515,   Relative Error 0.58470
Training_loss 2.40763,   Relative Error 0.58495
Training_loss 2.40919,   Relative Error 0.58514


 78%|███████▊  | 1567/2000 [02:32<00:38, 11.29it/s]

Training_loss 2.41397,   Relative Error 0.58569
Training_loss 2.40831,   Relative Error 0.58505
Training_loss 2.41297,   Relative Error 0.58556
Training_loss 2.41420,   Relative Error 0.58572


 78%|███████▊  | 1569/2000 [02:33<00:48,  8.84it/s]

Training_loss 2.41568,   Relative Error 0.58582
Training_loss 2.42207,   Relative Error 0.58655


 79%|███████▊  | 1572/2000 [02:33<01:02,  6.84it/s]

Training_loss 2.42485,   Relative Error 0.58685
Training_loss 2.42739,   Relative Error 0.58713


 79%|███████▊  | 1574/2000 [02:33<01:03,  6.72it/s]

Training_loss 2.42654,   Relative Error 0.58701
Training_loss 2.42720,   Relative Error 0.58706


 79%|███████▉  | 1576/2000 [02:34<00:59,  7.15it/s]

Training_loss 2.43159,   Relative Error 0.58756
Training_loss 2.43397,   Relative Error 0.58779


 79%|███████▉  | 1578/2000 [02:34<01:01,  6.83it/s]

Training_loss 2.43966,   Relative Error 0.58844
Training_loss 2.44380,   Relative Error 0.58894


 79%|███████▉  | 1580/2000 [02:34<01:17,  5.43it/s]

Training_loss 2.44729,   Relative Error 0.58933
Training_loss 2.44630,   Relative Error 0.58922


 79%|███████▉  | 1581/2000 [02:35<01:11,  5.84it/s]

Training_loss 2.44677,   Relative Error 0.58926
Training_loss 2.44986,   Relative Error 0.58958


 79%|███████▉  | 1583/2000 [02:35<01:02,  6.66it/s]

Training_loss 2.45707,   Relative Error 0.59041


 79%|███████▉  | 1585/2000 [02:35<01:09,  5.97it/s]

Training_loss 2.45626,   Relative Error 0.59025
Training_loss 2.45971,   Relative Error 0.59066


 79%|███████▉  | 1587/2000 [02:36<01:12,  5.66it/s]

Training_loss 2.46097,   Relative Error 0.59081
Training_loss 2.46741,   Relative Error 0.59155


 79%|███████▉  | 1589/2000 [02:36<01:14,  5.48it/s]

Training_loss 2.46548,   Relative Error 0.59130
Training_loss 2.47143,   Relative Error 0.59197


 80%|███████▉  | 1591/2000 [02:36<01:12,  5.61it/s]

Training_loss 2.47746,   Relative Error 0.59268
Training_loss 2.47813,   Relative Error 0.59269


 80%|███████▉  | 1592/2000 [02:37<01:26,  4.70it/s]

Training_loss 2.48382,   Relative Error 0.59337


 80%|███████▉  | 1593/2000 [02:37<01:28,  4.58it/s]

Training_loss 2.48140,   Relative Error 0.59310
Training_loss 2.48763,   Relative Error 0.59383

 80%|███████▉  | 1595/2000 [02:37<01:19,  5.08it/s]


Training_loss 2.49160,   Relative Error 0.59429


 80%|███████▉  | 1596/2000 [02:37<01:11,  5.67it/s]

Training_loss 2.49768,   Relative Error 0.59497


 80%|███████▉  | 1598/2000 [02:38<01:04,  6.21it/s]

Training_loss 2.49863,   Relative Error 0.59512
Training_loss 2.50214,   Relative Error 0.59550


 80%|████████  | 1600/2000 [02:38<00:58,  6.81it/s]

Training_loss 2.50605,   Relative Error 0.59595
Training_loss 2.50568,   Relative Error 0.59592


 80%|████████  | 1602/2000 [02:38<00:51,  7.76it/s]

Training_loss 2.50801,   Relative Error 0.59614
Training_loss 2.50726,   Relative Error 0.59601


 80%|████████  | 1604/2000 [02:38<00:47,  8.32it/s]

Training_loss 2.51126,   Relative Error 0.59649
Training_loss 2.50892,   Relative Error 0.59620


 80%|████████  | 1605/2000 [02:39<00:47,  8.28it/s]

Training_loss 2.51053,   Relative Error 0.59636
Training_loss 2.51512,   Relative Error 0.59686


 80%|████████  | 1608/2000 [02:39<00:44,  8.84it/s]

Training_loss 2.51546,   Relative Error 0.59688
Training_loss 2.51868,   Relative Error 0.59725


 80%|████████  | 1610/2000 [02:39<00:44,  8.79it/s]

Training_loss 2.51935,   Relative Error 0.59735
Training_loss 2.52205,   Relative Error 0.59767


 81%|████████  | 1612/2000 [02:39<00:52,  7.32it/s]

Training_loss 2.52076,   Relative Error 0.59753
Training_loss 2.52441,   Relative Error 0.59796


 81%|████████  | 1613/2000 [02:40<00:57,  6.77it/s]

Training_loss 2.52498,   Relative Error 0.59801


 81%|████████  | 1615/2000 [02:40<00:56,  6.79it/s]

Training_loss 2.52979,   Relative Error 0.59861
Training_loss 2.53311,   Relative Error 0.59896


 81%|████████  | 1617/2000 [02:40<00:58,  6.55it/s]

Training_loss 2.53994,   Relative Error 0.59972
Training_loss 2.54305,   Relative Error 0.60004


 81%|████████  | 1619/2000 [02:40<00:57,  6.63it/s]

Training_loss 2.54338,   Relative Error 0.60007
Training_loss 2.54992,   Relative Error 0.60084


 81%|████████  | 1621/2000 [02:41<00:45,  8.35it/s]

Training_loss 2.55260,   Relative Error 0.60116
Training_loss 2.55652,   Relative Error 0.60159
Training_loss 2.56375,   Relative Error 0.60238


 81%|████████  | 1624/2000 [02:41<00:43,  8.67it/s]

Training_loss 2.56415,   Relative Error 0.60250
Training_loss 2.56530,   Relative Error 0.60265


 81%|████████▏ | 1626/2000 [02:41<00:47,  7.94it/s]

Training_loss 2.56390,   Relative Error 0.60245
Training_loss 2.56381,   Relative Error 0.60242
Training_loss 2.56555,   Relative Error 0.60255


 82%|████████▏ | 1630/2000 [02:42<00:34, 10.61it/s]

Training_loss 2.56702,   Relative Error 0.60268
Training_loss 2.56963,   Relative Error 0.60300
Training_loss 2.57128,   Relative Error 0.60318


 82%|████████▏ | 1632/2000 [02:42<00:34, 10.60it/s]

Training_loss 2.57645,   Relative Error 0.60377
Training_loss 2.58272,   Relative Error 0.60448


 82%|████████▏ | 1634/2000 [02:42<00:36, 10.02it/s]

Training_loss 2.58072,   Relative Error 0.60426
Training_loss 2.58482,   Relative Error 0.60472
Training_loss 2.58407,   Relative Error 0.60465


 82%|████████▏ | 1638/2000 [02:42<00:32, 11.09it/s]

Training_loss 2.58597,   Relative Error 0.60487
Training_loss 2.58982,   Relative Error 0.60531
Training_loss 2.59064,   Relative Error 0.60535


 82%|████████▏ | 1640/2000 [02:42<00:32, 10.95it/s]

Training_loss 2.59004,   Relative Error 0.60531
Training_loss 2.59336,   Relative Error 0.60571
Training_loss 2.59140,   Relative Error 0.60544


 82%|████████▏ | 1644/2000 [02:43<00:33, 10.66it/s]

Training_loss 2.59662,   Relative Error 0.60600
Training_loss 2.59626,   Relative Error 0.60597
Training_loss 2.59764,   Relative Error 0.60603


 82%|████████▏ | 1646/2000 [02:43<00:32, 10.93it/s]

Training_loss 2.59895,   Relative Error 0.60615
Training_loss 2.59920,   Relative Error 0.60616
Training_loss 2.60498,   Relative Error 0.60683


 82%|████████▎ | 1650/2000 [02:43<00:33, 10.38it/s]

Training_loss 2.60653,   Relative Error 0.60703
Training_loss 2.60974,   Relative Error 0.60741
Training_loss 2.61387,   Relative Error 0.60790


 83%|████████▎ | 1652/2000 [02:44<00:33, 10.29it/s]

Training_loss 2.61681,   Relative Error 0.60818
Training_loss 2.62079,   Relative Error 0.60866
Training_loss 2.62435,   Relative Error 0.60902


 83%|████████▎ | 1656/2000 [02:44<00:32, 10.74it/s]

Training_loss 2.62928,   Relative Error 0.60958
Training_loss 2.63182,   Relative Error 0.60985
Training_loss 2.63719,   Relative Error 0.61045


 83%|████████▎ | 1658/2000 [02:44<00:30, 11.22it/s]

Training_loss 2.63612,   Relative Error 0.61033
Training_loss 2.64211,   Relative Error 0.61096
Training_loss 2.64103,   Relative Error 0.61083


 83%|████████▎ | 1662/2000 [02:44<00:28, 11.84it/s]

Training_loss 2.64172,   Relative Error 0.61097
Training_loss 2.64010,   Relative Error 0.61079
Training_loss 2.63803,   Relative Error 0.61060


 83%|████████▎ | 1664/2000 [02:45<00:30, 11.15it/s]

Training_loss 2.63082,   Relative Error 0.60972
Training_loss 2.63610,   Relative Error 0.61030
Training_loss 2.64056,   Relative Error 0.61079


 83%|████████▎ | 1668/2000 [02:45<00:29, 11.14it/s]

Training_loss 2.63937,   Relative Error 0.61063
Training_loss 2.63976,   Relative Error 0.61065
Training_loss 2.64142,   Relative Error 0.61080


 84%|████████▎ | 1670/2000 [02:45<00:28, 11.54it/s]

Training_loss 2.64594,   Relative Error 0.61131
Training_loss 2.64902,   Relative Error 0.61170
Training_loss 2.65177,   Relative Error 0.61199


 84%|████████▎ | 1674/2000 [02:46<00:27, 11.75it/s]

Training_loss 2.65286,   Relative Error 0.61211
Training_loss 2.64820,   Relative Error 0.61155
Training_loss 2.65057,   Relative Error 0.61177


 84%|████████▍ | 1676/2000 [02:46<00:27, 11.91it/s]

Training_loss 2.65685,   Relative Error 0.61244
Training_loss 2.65969,   Relative Error 0.61281
Training_loss 2.66022,   Relative Error 0.61288


 84%|████████▍ | 1678/2000 [02:46<00:28, 11.25it/s]

Training_loss 2.66579,   Relative Error 0.61350
Training_loss 2.66730,   Relative Error 0.61370


 84%|████████▍ | 1682/2000 [02:46<00:28, 11.14it/s]

Training_loss 2.67285,   Relative Error 0.61432
Training_loss 2.67657,   Relative Error 0.61473
Training_loss 2.67701,   Relative Error 0.61479


 84%|████████▍ | 1684/2000 [02:46<00:30, 10.50it/s]

Training_loss 2.68101,   Relative Error 0.61523
Training_loss 2.68283,   Relative Error 0.61537
Training_loss 2.68888,   Relative Error 0.61607


 84%|████████▍ | 1688/2000 [02:47<00:28, 10.96it/s]

Training_loss 2.69027,   Relative Error 0.61621
Training_loss 2.69586,   Relative Error 0.61684
Training_loss 2.69526,   Relative Error 0.61676


 84%|████████▍ | 1690/2000 [02:47<00:28, 10.80it/s]

Training_loss 2.69727,   Relative Error 0.61699
Training_loss 2.69955,   Relative Error 0.61726


 85%|████████▍ | 1692/2000 [02:47<00:28, 10.86it/s]

Training_loss 2.69773,   Relative Error 0.61702
Training_loss 2.70144,   Relative Error 0.61739
Training_loss 2.70844,   Relative Error 0.61816


 85%|████████▍ | 1696/2000 [02:48<00:28, 10.69it/s]

Training_loss 2.70897,   Relative Error 0.61823
Training_loss 2.71468,   Relative Error 0.61887
Training_loss 2.71766,   Relative Error 0.61925


 85%|████████▍ | 1698/2000 [02:48<00:27, 10.88it/s]

Training_loss 2.72483,   Relative Error 0.62006
Training_loss 2.72693,   Relative Error 0.62032
Training_loss 2.72871,   Relative Error 0.62047


 85%|████████▌ | 1702/2000 [02:48<00:26, 11.33it/s]

Training_loss 2.73180,   Relative Error 0.62081
Training_loss 2.73397,   Relative Error 0.62104
Training_loss 2.73684,   Relative Error 0.62136


 85%|████████▌ | 1704/2000 [02:48<00:27, 10.74it/s]

Training_loss 2.74255,   Relative Error 0.62202
Training_loss 2.74576,   Relative Error 0.62242


 85%|████████▌ | 1706/2000 [02:49<00:28, 10.20it/s]

Training_loss 2.74601,   Relative Error 0.62248
Training_loss 2.74955,   Relative Error 0.62289
Training_loss 2.74991,   Relative Error 0.62286


 85%|████████▌ | 1708/2000 [02:49<00:28, 10.37it/s]

Training_loss 2.74165,   Relative Error 0.62193
Training_loss 2.73870,   Relative Error 0.62161


 86%|████████▌ | 1712/2000 [02:49<00:28, 10.11it/s]

Training_loss 2.73447,   Relative Error 0.62111
Training_loss 2.73180,   Relative Error 0.62084
Training_loss 2.73555,   Relative Error 0.62127


 86%|████████▌ | 1714/2000 [02:49<00:27, 10.43it/s]

Training_loss 2.73896,   Relative Error 0.62168
Training_loss 2.74671,   Relative Error 0.62255
Training_loss 2.74695,   Relative Error 0.62257


 86%|████████▌ | 1718/2000 [02:50<00:26, 10.46it/s]

Training_loss 2.74830,   Relative Error 0.62268
Training_loss 2.75516,   Relative Error 0.62343
Training_loss 2.75371,   Relative Error 0.62326


 86%|████████▌ | 1720/2000 [02:50<00:25, 10.95it/s]

Training_loss 2.75949,   Relative Error 0.62389
Training_loss 2.76536,   Relative Error 0.62455
Training_loss 2.77231,   Relative Error 0.62527


 86%|████████▌ | 1724/2000 [02:50<00:24, 11.24it/s]

Training_loss 2.77226,   Relative Error 0.62525
Training_loss 2.77482,   Relative Error 0.62545
Training_loss 2.77651,   Relative Error 0.62554


 86%|████████▋ | 1726/2000 [02:50<00:24, 11.10it/s]

Training_loss 2.77891,   Relative Error 0.62579
Training_loss 2.78084,   Relative Error 0.62601
Training_loss 2.78078,   Relative Error 0.62596


 86%|████████▋ | 1730/2000 [02:51<00:23, 11.40it/s]

Training_loss 2.78980,   Relative Error 0.62695
Training_loss 2.79340,   Relative Error 0.62732
Training_loss 2.79099,   Relative Error 0.62701


 87%|████████▋ | 1732/2000 [02:51<00:23, 11.59it/s]

Training_loss 2.78806,   Relative Error 0.62679
Training_loss 2.79374,   Relative Error 0.62743
Training_loss 2.79065,   Relative Error 0.62710


 87%|████████▋ | 1736/2000 [02:51<00:23, 11.42it/s]

Training_loss 2.79644,   Relative Error 0.62774
Training_loss 2.79592,   Relative Error 0.62763
Training_loss 2.79966,   Relative Error 0.62802


 87%|████████▋ | 1738/2000 [02:51<00:23, 11.09it/s]

Training_loss 2.80496,   Relative Error 0.62858
Training_loss 2.80477,   Relative Error 0.62856
Training_loss 2.80380,   Relative Error 0.62842


 87%|████████▋ | 1742/2000 [02:52<00:23, 10.94it/s]

Training_loss 2.80729,   Relative Error 0.62877
Training_loss 2.81227,   Relative Error 0.62930
Training_loss 2.81768,   Relative Error 0.62991


 87%|████████▋ | 1744/2000 [02:52<00:23, 10.89it/s]

Training_loss 2.82177,   Relative Error 0.63030
Training_loss 2.82549,   Relative Error 0.63069
Training_loss 2.82768,   Relative Error 0.63096


 87%|████████▋ | 1748/2000 [02:52<00:23, 10.68it/s]

Training_loss 2.82380,   Relative Error 0.63054
Training_loss 2.82762,   Relative Error 0.63097
Training_loss 2.83045,   Relative Error 0.63128


 88%|████████▊ | 1750/2000 [02:53<00:23, 10.55it/s]

Training_loss 2.83295,   Relative Error 0.63151
Training_loss 2.83412,   Relative Error 0.63168
Training_loss 2.83479,   Relative Error 0.63176


 88%|████████▊ | 1754/2000 [02:53<00:22, 10.93it/s]

Training_loss 2.83880,   Relative Error 0.63222
Training_loss 2.84335,   Relative Error 0.63271
Training_loss 2.84745,   Relative Error 0.63314


 88%|████████▊ | 1756/2000 [02:53<00:22, 10.80it/s]

Training_loss 2.85123,   Relative Error 0.63354
Training_loss 2.85748,   Relative Error 0.63421
Training_loss 2.86115,   Relative Error 0.63461


 88%|████████▊ | 1760/2000 [02:53<00:21, 11.07it/s]

Training_loss 2.85800,   Relative Error 0.63420
Training_loss 2.85842,   Relative Error 0.63426
Training_loss 2.86112,   Relative Error 0.63458


 88%|████████▊ | 1762/2000 [02:54<00:20, 11.33it/s]

Training_loss 2.86643,   Relative Error 0.63516
Training_loss 2.86772,   Relative Error 0.63527


 88%|████████▊ | 1764/2000 [02:54<00:23, 10.23it/s]

Training_loss 2.86845,   Relative Error 0.63536
Training_loss 2.86939,   Relative Error 0.63538
Training_loss 2.87631,   Relative Error 0.63613


 88%|████████▊ | 1766/2000 [02:54<00:22, 10.23it/s]

Training_loss 2.87438,   Relative Error 0.63594
Training_loss 2.87577,   Relative Error 0.63610


 88%|████████▊ | 1768/2000 [02:54<00:23,  9.82it/s]

Training_loss 2.87939,   Relative Error 0.63649
Training_loss 2.88359,   Relative Error 0.63694


 89%|████████▊ | 1771/2000 [02:55<00:24,  9.40it/s]

Training_loss 2.88641,   Relative Error 0.63722
Training_loss 2.89165,   Relative Error 0.63779
Training_loss 2.89806,   Relative Error 0.63844


 89%|████████▉ | 1775/2000 [02:55<00:21, 10.46it/s]

Training_loss 2.89534,   Relative Error 0.63815
Training_loss 2.90263,   Relative Error 0.63890
Training_loss 2.90454,   Relative Error 0.63913


 89%|████████▉ | 1777/2000 [02:55<00:21, 10.24it/s]

Training_loss 2.90889,   Relative Error 0.63961
Training_loss 2.90702,   Relative Error 0.63942


 89%|████████▉ | 1779/2000 [02:55<00:21, 10.47it/s]

Training_loss 2.90578,   Relative Error 0.63927
Training_loss 2.90277,   Relative Error 0.63889
Training_loss 2.90413,   Relative Error 0.63901


 89%|████████▉ | 1783/2000 [02:56<00:20, 10.66it/s]

Training_loss 2.91003,   Relative Error 0.63961
Training_loss 2.91152,   Relative Error 0.63978
Training_loss 2.91166,   Relative Error 0.63981


 89%|████████▉ | 1785/2000 [02:56<00:20, 10.39it/s]

Training_loss 2.90752,   Relative Error 0.63942
Training_loss 2.91002,   Relative Error 0.63968


 89%|████████▉ | 1787/2000 [02:56<00:19, 10.67it/s]

Training_loss 2.90989,   Relative Error 0.63964
Training_loss 2.90518,   Relative Error 0.63905
Training_loss 2.91047,   Relative Error 0.63964


 90%|████████▉ | 1791/2000 [02:56<00:18, 11.31it/s]

Training_loss 2.90884,   Relative Error 0.63945
Training_loss 2.91269,   Relative Error 0.63985
Training_loss 2.91409,   Relative Error 0.63996


 90%|████████▉ | 1793/2000 [02:57<00:19, 10.67it/s]

Training_loss 2.91465,   Relative Error 0.63998
Training_loss 2.91809,   Relative Error 0.64032


 90%|████████▉ | 1795/2000 [02:57<00:19, 10.33it/s]

Training_loss 2.91170,   Relative Error 0.63967
Training_loss 2.91514,   Relative Error 0.64001
Training_loss 2.91974,   Relative Error 0.64051


 90%|████████▉ | 1799/2000 [02:57<00:18, 10.83it/s]

Training_loss 2.92182,   Relative Error 0.64074
Training_loss 2.91848,   Relative Error 0.64040
Training_loss 2.92116,   Relative Error 0.64066


 90%|█████████ | 1801/2000 [02:57<00:18, 10.76it/s]

Training_loss 2.92344,   Relative Error 0.64087
Training_loss 2.92846,   Relative Error 0.64139
Training_loss 2.92778,   Relative Error 0.64131


 90%|█████████ | 1805/2000 [02:58<00:17, 11.09it/s]

Training_loss 2.93001,   Relative Error 0.64156
Training_loss 2.92925,   Relative Error 0.64152
Training_loss 2.93131,   Relative Error 0.64174


 90%|█████████ | 1807/2000 [02:58<00:18, 10.19it/s]

Training_loss 2.93039,   Relative Error 0.64164
Training_loss 2.92725,   Relative Error 0.64124


 90%|█████████ | 1809/2000 [02:58<00:18, 10.30it/s]

Training_loss 2.93103,   Relative Error 0.64167
Training_loss 2.93689,   Relative Error 0.64231
Training_loss 2.93773,   Relative Error 0.64239


 91%|█████████ | 1813/2000 [02:59<00:18, 10.10it/s]

Training_loss 2.94414,   Relative Error 0.64305
Training_loss 2.94934,   Relative Error 0.64360
Training_loss 2.95556,   Relative Error 0.64427


 91%|█████████ | 1815/2000 [02:59<00:17, 10.58it/s]

Training_loss 2.95271,   Relative Error 0.64401
Training_loss 2.95771,   Relative Error 0.64456
Training_loss 2.95885,   Relative Error 0.64471


 91%|█████████ | 1819/2000 [02:59<00:17, 10.64it/s]

Training_loss 2.96133,   Relative Error 0.64498
Training_loss 2.96527,   Relative Error 0.64541
Training_loss 2.96619,   Relative Error 0.64547


 91%|█████████ | 1821/2000 [02:59<00:16, 10.77it/s]

Training_loss 2.96688,   Relative Error 0.64547
Training_loss 2.96758,   Relative Error 0.64555
Training_loss 2.96751,   Relative Error 0.64556


 91%|█████████▏| 1825/2000 [03:00<00:16, 10.86it/s]

Training_loss 2.96488,   Relative Error 0.64527
Training_loss 2.97033,   Relative Error 0.64586
Training_loss 2.97019,   Relative Error 0.64587


 91%|█████████▏| 1827/2000 [03:00<00:16, 10.75it/s]

Training_loss 2.97356,   Relative Error 0.64619
Training_loss 2.97419,   Relative Error 0.64620
Training_loss 2.97805,   Relative Error 0.64660


 91%|█████████▏| 1829/2000 [03:00<00:15, 11.02it/s]

Training_loss 2.98060,   Relative Error 0.64685
Training_loss 2.97813,   Relative Error 0.64656


 92%|█████████▏| 1833/2000 [03:00<00:16, 10.42it/s]

Training_loss 2.97852,   Relative Error 0.64662
Training_loss 2.98031,   Relative Error 0.64678
Training_loss 2.98207,   Relative Error 0.64691


 92%|█████████▏| 1835/2000 [03:01<00:16,  9.86it/s]

Training_loss 2.98699,   Relative Error 0.64746
Training_loss 2.98092,   Relative Error 0.64688


 92%|█████████▏| 1837/2000 [03:01<00:18,  8.76it/s]

Training_loss 2.98410,   Relative Error 0.64719
Training_loss 2.98443,   Relative Error 0.64721


 92%|█████████▏| 1840/2000 [03:01<00:17,  8.97it/s]

Training_loss 2.98958,   Relative Error 0.64781
Training_loss 2.99266,   Relative Error 0.64816
Training_loss 2.99007,   Relative Error 0.64782


 92%|█████████▏| 1842/2000 [03:02<00:17,  9.05it/s]

Training_loss 2.98929,   Relative Error 0.64771
Training_loss 2.98937,   Relative Error 0.64769


 92%|█████████▏| 1845/2000 [03:02<00:16,  9.67it/s]

Training_loss 2.98714,   Relative Error 0.64750
Training_loss 2.99191,   Relative Error 0.64794
Training_loss 2.98750,   Relative Error 0.64747


 92%|█████████▏| 1848/2000 [03:02<00:14, 10.35it/s]

Training_loss 2.99246,   Relative Error 0.64796
Training_loss 2.99648,   Relative Error 0.64841
Training_loss 3.00008,   Relative Error 0.64881


 92%|█████████▎| 1850/2000 [03:02<00:13, 11.09it/s]

Training_loss 3.00271,   Relative Error 0.64903
Training_loss 3.00946,   Relative Error 0.64972


 93%|█████████▎| 1852/2000 [03:02<00:14, 10.10it/s]

Training_loss 3.01216,   Relative Error 0.64999
Training_loss 3.01433,   Relative Error 0.65023
Training_loss 3.01509,   Relative Error 0.65018


 93%|█████████▎| 1856/2000 [03:03<00:12, 11.62it/s]

Training_loss 3.02030,   Relative Error 0.65075
Training_loss 3.02426,   Relative Error 0.65115
Training_loss 3.03143,   Relative Error 0.65186


 93%|█████████▎| 1858/2000 [03:03<00:11, 12.22it/s]

Training_loss 3.03813,   Relative Error 0.65255
Training_loss 3.04041,   Relative Error 0.65282
Training_loss 3.03800,   Relative Error 0.65258


 93%|█████████▎| 1862/2000 [03:03<00:10, 12.76it/s]

Training_loss 3.03457,   Relative Error 0.65226
Training_loss 3.04086,   Relative Error 0.65291
Training_loss 3.04517,   Relative Error 0.65336


 93%|█████████▎| 1864/2000 [03:03<00:10, 12.87it/s]

Training_loss 3.05465,   Relative Error 0.65431
Training_loss 3.05437,   Relative Error 0.65422
Training_loss 3.05419,   Relative Error 0.65425


 93%|█████████▎| 1868/2000 [03:04<00:11, 11.85it/s]

Training_loss 3.05336,   Relative Error 0.65417
Training_loss 3.05596,   Relative Error 0.65447
Training_loss 3.05156,   Relative Error 0.65393


 94%|█████████▎| 1870/2000 [03:04<00:11, 11.30it/s]

Training_loss 3.05923,   Relative Error 0.65472
Training_loss 3.06424,   Relative Error 0.65528
Training_loss 3.06647,   Relative Error 0.65549


 94%|█████████▎| 1874/2000 [03:04<00:11, 10.96it/s]

Training_loss 3.07193,   Relative Error 0.65607
Training_loss 3.07132,   Relative Error 0.65602
Training_loss 3.07223,   Relative Error 0.65610


 94%|█████████▍| 1876/2000 [03:05<00:13,  9.39it/s]

Training_loss 3.07449,   Relative Error 0.65635
Training_loss 3.06949,   Relative Error 0.65588
Training_loss 3.07437,   Relative Error 0.65639


 94%|█████████▍| 1880/2000 [03:05<00:11, 10.35it/s]

Training_loss 3.08070,   Relative Error 0.65704
Training_loss 3.08586,   Relative Error 0.65760
Training_loss 3.08360,   Relative Error 0.65734


 94%|█████████▍| 1882/2000 [03:05<00:11, 10.07it/s]

Training_loss 3.09014,   Relative Error 0.65795
Training_loss 3.09480,   Relative Error 0.65845
Training_loss 3.10095,   Relative Error 0.65912


 94%|█████████▍| 1884/2000 [03:05<00:10, 10.57it/s]

Training_loss 3.10328,   Relative Error 0.65933
Training_loss 3.10769,   Relative Error 0.65977


 94%|█████████▍| 1886/2000 [03:06<00:11,  9.97it/s]

Training_loss 3.10814,   Relative Error 0.65980
Training_loss 3.10432,   Relative Error 0.65944


 94%|█████████▍| 1890/2000 [03:06<00:11,  9.68it/s]

Training_loss 3.10416,   Relative Error 0.65934
Training_loss 3.10517,   Relative Error 0.65942
Training_loss 3.10226,   Relative Error 0.65917


 95%|█████████▍| 1892/2000 [03:06<00:10, 10.00it/s]

Training_loss 3.11027,   Relative Error 0.66000
Training_loss 3.10822,   Relative Error 0.65982
Training_loss 3.11085,   Relative Error 0.66009


 95%|█████████▍| 1896/2000 [03:07<00:10, 10.22it/s]

Training_loss 3.11598,   Relative Error 0.66064
Training_loss 3.11394,   Relative Error 0.66049
Training_loss 3.11687,   Relative Error 0.66082


 95%|█████████▍| 1898/2000 [03:07<00:10, 10.06it/s]

Training_loss 3.12358,   Relative Error 0.66149
Training_loss 3.11818,   Relative Error 0.66086
Training_loss 3.11469,   Relative Error 0.66049


 95%|█████████▌| 1902/2000 [03:07<00:09, 10.52it/s]

Training_loss 3.11645,   Relative Error 0.66065
Training_loss 3.12207,   Relative Error 0.66125
Training_loss 3.12324,   Relative Error 0.66137


 95%|█████████▌| 1904/2000 [03:07<00:09, 10.42it/s]

Training_loss 3.11648,   Relative Error 0.66072
Training_loss 3.11882,   Relative Error 0.66095
Training_loss 3.12222,   Relative Error 0.66135


 95%|█████████▌| 1908/2000 [03:08<00:08, 10.53it/s]

Training_loss 3.12034,   Relative Error 0.66115
Training_loss 3.12629,   Relative Error 0.66178
Training_loss 3.13365,   Relative Error 0.66251


 96%|█████████▌| 1910/2000 [03:08<00:08, 10.85it/s]

Training_loss 3.13992,   Relative Error 0.66312
Training_loss 3.14151,   Relative Error 0.66329
Training_loss 3.14428,   Relative Error 0.66359


 96%|█████████▌| 1914/2000 [03:08<00:07, 11.57it/s]

Training_loss 3.14923,   Relative Error 0.66413
Training_loss 3.15256,   Relative Error 0.66447
Training_loss 3.15309,   Relative Error 0.66446


 96%|█████████▌| 1916/2000 [03:08<00:07, 11.86it/s]

Training_loss 3.15386,   Relative Error 0.66453
Training_loss 3.14907,   Relative Error 0.66409


 96%|█████████▌| 1918/2000 [03:09<00:07, 10.49it/s]

Training_loss 3.14969,   Relative Error 0.66412
Training_loss 3.14653,   Relative Error 0.66380
Training_loss 3.14450,   Relative Error 0.66363


 96%|█████████▌| 1922/2000 [03:09<00:07, 11.06it/s]

Training_loss 3.14620,   Relative Error 0.66381
Training_loss 3.14670,   Relative Error 0.66383
Training_loss 3.14814,   Relative Error 0.66396


 96%|█████████▌| 1924/2000 [03:09<00:06, 11.34it/s]

Training_loss 3.15259,   Relative Error 0.66444
Training_loss 3.15679,   Relative Error 0.66486
Training_loss 3.15177,   Relative Error 0.66432


 96%|█████████▋| 1928/2000 [03:09<00:06, 11.34it/s]

Training_loss 3.15302,   Relative Error 0.66446
Training_loss 3.15866,   Relative Error 0.66501
Training_loss 3.16370,   Relative Error 0.66558


 96%|█████████▋| 1930/2000 [03:10<00:06, 10.11it/s]

Training_loss 3.16140,   Relative Error 0.66533
Training_loss 3.15537,   Relative Error 0.66474


 97%|█████████▋| 1932/2000 [03:10<00:06,  9.92it/s]

Training_loss 3.16122,   Relative Error 0.66536
Training_loss 3.15963,   Relative Error 0.66512
Training_loss 3.16662,   Relative Error 0.66583


 97%|█████████▋| 1936/2000 [03:10<00:06, 10.62it/s]

Training_loss 3.16303,   Relative Error 0.66548
Training_loss 3.16291,   Relative Error 0.66545
Training_loss 3.16302,   Relative Error 0.66542


 97%|█████████▋| 1938/2000 [03:10<00:05, 10.93it/s]

Training_loss 3.16719,   Relative Error 0.66578
Training_loss 3.17560,   Relative Error 0.66667
Training_loss 3.17044,   Relative Error 0.66621


 97%|█████████▋| 1942/2000 [03:11<00:05, 10.77it/s]

Training_loss 3.17337,   Relative Error 0.66648
Training_loss 3.17339,   Relative Error 0.66649
Training_loss 3.17822,   Relative Error 0.66696


 97%|█████████▋| 1944/2000 [03:11<00:05, 10.73it/s]

Training_loss 3.17740,   Relative Error 0.66684
Training_loss 3.18506,   Relative Error 0.66760
Training_loss 3.18950,   Relative Error 0.66806


 97%|█████████▋| 1948/2000 [03:11<00:05,  9.93it/s]

Training_loss 3.18165,   Relative Error 0.66723
Training_loss 3.18529,   Relative Error 0.66759
Training_loss 3.19026,   Relative Error 0.66809


 98%|█████████▊| 1950/2000 [03:12<00:04, 10.29it/s]

Training_loss 3.19277,   Relative Error 0.66837
Training_loss 3.20044,   Relative Error 0.66915
Training_loss 3.19894,   Relative Error 0.66892


 98%|█████████▊| 1954/2000 [03:12<00:04, 10.35it/s]

Training_loss 3.19918,   Relative Error 0.66890
Training_loss 3.20340,   Relative Error 0.66930
Training_loss 3.20956,   Relative Error 0.66992


 98%|█████████▊| 1956/2000 [03:12<00:04, 10.37it/s]

Training_loss 3.20951,   Relative Error 0.66988
Training_loss 3.21182,   Relative Error 0.67013
Training_loss 3.21684,   Relative Error 0.67066


 98%|█████████▊| 1960/2000 [03:13<00:03, 10.27it/s]

Training_loss 3.21932,   Relative Error 0.67089
Training_loss 3.22514,   Relative Error 0.67147
Training_loss 3.22632,   Relative Error 0.67152


 98%|█████████▊| 1962/2000 [03:13<00:03,  9.88it/s]

Training_loss 3.22315,   Relative Error 0.67119
Training_loss 3.22756,   Relative Error 0.67160
Training_loss 3.22091,   Relative Error 0.67097


 98%|█████████▊| 1965/2000 [03:13<00:03,  9.76it/s]

Training_loss 3.22558,   Relative Error 0.67143
Training_loss 3.21909,   Relative Error 0.67079


 98%|█████████▊| 1968/2000 [03:13<00:03, 10.26it/s]

Training_loss 3.21574,   Relative Error 0.67044
Training_loss 3.21942,   Relative Error 0.67080
Training_loss 3.22479,   Relative Error 0.67131


 98%|█████████▊| 1970/2000 [03:14<00:02, 10.41it/s]

Training_loss 3.22977,   Relative Error 0.67178
Training_loss 3.23514,   Relative Error 0.67234
Training_loss 3.23473,   Relative Error 0.67230


 99%|█████████▊| 1974/2000 [03:14<00:02, 11.06it/s]

Training_loss 3.23959,   Relative Error 0.67278
Training_loss 3.24480,   Relative Error 0.67332
Training_loss 3.24750,   Relative Error 0.67358


 99%|█████████▉| 1976/2000 [03:14<00:02, 10.53it/s]

Training_loss 3.24563,   Relative Error 0.67343
Training_loss 3.24547,   Relative Error 0.67336


 99%|█████████▉| 1978/2000 [03:14<00:02, 10.06it/s]

Training_loss 3.24413,   Relative Error 0.67320
Training_loss 3.24983,   Relative Error 0.67376
Training_loss 3.25386,   Relative Error 0.67418


 99%|█████████▉| 1982/2000 [03:15<00:01, 10.27it/s]

Training_loss 3.25833,   Relative Error 0.67461
Training_loss 3.25460,   Relative Error 0.67423
Training_loss 3.25829,   Relative Error 0.67455


 99%|█████████▉| 1984/2000 [03:15<00:01, 10.16it/s]

Training_loss 3.25943,   Relative Error 0.67470
Training_loss 3.26351,   Relative Error 0.67511
Training_loss 3.26348,   Relative Error 0.67514


 99%|█████████▉| 1988/2000 [03:15<00:01, 10.64it/s]

Training_loss 3.25995,   Relative Error 0.67482
Training_loss 3.26414,   Relative Error 0.67530
Training_loss 3.26241,   Relative Error 0.67512


100%|█████████▉| 1990/2000 [03:15<00:00, 10.95it/s]

Training_loss 3.26933,   Relative Error 0.67577
Training_loss 3.27491,   Relative Error 0.67638
Training_loss 3.27516,   Relative Error 0.67648


100%|█████████▉| 1994/2000 [03:16<00:00, 11.42it/s]

Training_loss 3.27599,   Relative Error 0.67656
Training_loss 3.27260,   Relative Error 0.67619
Training_loss 3.27112,   Relative Error 0.67605


100%|█████████▉| 1996/2000 [03:16<00:00, 11.59it/s]

Training_loss 3.27186,   Relative Error 0.67608
Training_loss 3.27775,   Relative Error 0.67664
Training_loss 3.27921,   Relative Error 0.67673


100%|██████████| 2000/2000 [03:16<00:00, 11.03it/s]

Training_loss 3.28108,   Relative Error 0.67689
Training_loss 3.28706,   Relative Error 0.67744
Training_loss 3.29104,   Relative Error 0.67780


100%|██████████| 2000/2000 [03:16<00:00, 10.16it/s]


In [21]:
#plot.plot(test_loss)
parameters_to_vector(models[19].parameters())

tensor([-0.4318,  0.8972], grad_fn=<CatBackward0>)

In [22]:
for j in G.neighbors(0):
    print(j)

1
2
3
4
5
6
8
9


In [23]:
parameters_to_vector(models[0].parameters())

tensor([1.6000, 1.6499], grad_fn=<CatBackward0>)

In [24]:
projection_list[0]

[0,
 tensor([[1.6759, 0.0216],
         [0.0324, 1.6650]]),
 tensor([[-0.6451,  0.0216],
         [ 0.0324, -0.6560]]),
 tensor([[0.2735, 0.0216],
         [0.0324, 0.2627]]),
 tensor([[1.8554, 0.0216],
         [0.0324, 1.8446]]),
 tensor([[1.4208, 0.0216],
         [0.0324, 1.4100]]),
 tensor([[1.8028, 0.0216],
         [0.0324, 1.7919]]),
 0,
 tensor([[-0.1485,  0.0216],
         [ 0.0324, -0.1593]]),
 tensor([[0.6351, 0.0216],
         [0.0324, 0.6243]]),
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0]

In [25]:
projected_weights[0]

[0,
 tensor([0.7034, 0.7067]),
 tensor([1.2669, 1.3014]),
 tensor([2.4557, 2.4774]),
 tensor([1.9456, 1.9814]),
 tensor([1.9136, 1.9484]),
 tensor([2.9050, 2.9510]),
 0,
 tensor([-0.7182, -0.7182]),
 tensor([0.6922, 0.7336]),
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0]

In [26]:
test_loss = np.array(test_loss)
total_rel_error = np.array(total_rel_error)

In [27]:
print(test_loss)

[8.87525535 8.84789896 8.80522132 ... 3.28108424 3.28705674 3.29104424]


In [28]:
np.save( 'training_loss_sheave_fml' + str(lamda).replace('.', '_'), test_loss)
np.save('relative_error_sheave_fml' + str(lamda).replace('.', '_'), total_rel_error)