### 2018/2019 - Task List 10

1. Implement Naive Bayes classifier with pyro
    - create apropriate parameters (mean and std for a and b, sigma - noise)
    - provide optimization procedure
    - check appropriateness of implemented method with selected dataset


# Required imports

In [1]:
%matplotlib inline
import pyro
import torch
import numpy as np
import matplotlib.pyplot as plt
import pyro.optim as optim
import pyro.distributions as dist
from torch.distributions import constraints
from tqdm import tqdm
import seaborn as sns
from matplotlib import animation, rc
from IPython.display import HTML
import torch.nn as nn
from functools import partial
import pandas as pd
from pyro.contrib.autoguide import AutoDiagonalNormal
from pyro.infer import EmpiricalMarginal, SVI, Trace_ELBO, TracePredictive

In [2]:
pyro.set_rng_seed(1)
pyro.enable_validation(True)

In [3]:
from sklearn import datasets, model_selection
from sklearn.naive_bayes import GaussianNB


## Solutions

### sklearn solution

In [4]:
iris = datasets.load_iris()

gnb = GaussianNB()


X_train, X_validation, Y_train, Y_validation = model_selection.train_test_split(
    iris.data, iris.target, test_size=0.33, random_state=5)

In [5]:
y_pred = gnb.fit(iris.data, iris.target).predict(iris.data)

In [6]:
kfold = 5
scoring = ['accuracy', 'f1_micro', 'f1_macro']
cv_results = model_selection.cross_validate(gnb, X_train, Y_train, cv=kfold, scoring=scoring)

#displaying the mean and standard deviation of the prediction
for score in scoring: 
    msg = "%s: %f (%f)" % ('NB ' + score, cv_results['test_' + score].mean(), cv_results['test_' + score].std())
    print(msg)

NB accuracy: 0.960902 (0.035958)
NB f1_micro: 0.960902 (0.035958)
NB f1_macro: 0.960191 (0.036241)


### self-made NB

In [7]:
class NaiveBayesClassifier:
    
    def __init__(self, x_data, y_data):
        self.X = x_data
        self.y = y_data
        self.attributes_number = x_data.shape[1]
        self.classes = np.unique(y_data)
    
    def fit(self):
        pass
    
    def predict(self):
        pass
    
    def div_by_category(self, x_data, y_data):
        X_cl = {}

        for i in range(len(x_data)):
            if y_data[i] not in X_cl.keys():
                X_cl[y_data[i]] = list()
            X_cl[y_data[i]].append(x_data[i])

        for cl_key in categories:
            X_cl[cl_key] = np.array(X_cl[cl_key])

        return X_cl
    
    def model(self, x_data, label):
        mean = torch.tensor(np.random.choice(x_data, 1))
        scale = torch.tensor(1.0)
        with pyro.plate('data_loop', len(x_data)):
            pyro.sample('prob', dist.Normal(mean, scale), obs=x_data, infer={'is_auxiliary': True})
        
    def guide(self, x_data, label):
        mean = pyro.param('mean' + str(label), torch.tensor(np.random.choice(x_data, 1)))
        scale = pyro.param('scale' + str(label), torch.tensor(np.random.choice(1.)), constraint=constraints.positive)
        pyro.sample('prob', dist.Normal(mean, scale))
        
        

In [25]:
def div_by_category(x_data, y_data):
    X_cl = {}

    for i in range(len(x_data)):
        for attribute in range(len(x_data[0])):
            if (y_data[i], attribute) not in X_cl.keys():
                X_cl[(y_data[i], attribute)] = list()
            X_cl[(y_data[i], attribute)].append(x_data[i][attribute])

    for cl_key in np.unique(y_data):
        for attribute in range(len(x_data[0])):
            X_cl[cl_key, attribute] = np.array(X_cl[cl_key, attribute])

    return X_cl

def model(x_data, label):
    #mean = torch.tensor(np.random.choice(x_data, 1)).double()
    mean = torch.tensor(2.0).double()
    scale = torch.tensor(1.0).double()
    with pyro.plate('data_loop' + str(label), len(x_data)):
        pyro.sample('prob' + str(label), dist.Normal(mean, scale), obs=x_data)

def guide(x_data, label):
#     x_data = torch.from_numpy(x_data).double()
    mean = pyro.param('mean' + str(label), torch.tensor(2.0))
    scale = pyro.param('scale' + str(label), torch.tensor(1.0), constraint=constraints.positive)
    pyro.sample('prob' + str(label), dist.Normal(mean.double(), scale.double()), infer={'is_auxiliary': True})
    
def train(data, label, num_steps=3000):
    pyro.clear_param_store()
    
    optim = pyro.optim.Adam({"lr": 0.045})
    svi = pyro.infer.SVI(model=model,
                         guide=guide,
                         optim=optim,
                         loss=pyro.infer.Trace_ELBO(), num_samples=len(data))

    losses = []
    t = tqdm(range(num_steps))
    for j in t:
        loss = svi.step(torch.from_numpy(data), label)
        losses.append(loss)
        print(pyro.param("mean" + str(label)))
        t.set_postfix(loss=loss)
    return pyro.param("mean" + str(label)), pyro.param("scale" + str(label)), losses

In [26]:
divided_data = div_by_category(X_train, Y_train)
train(divided_data[(0, 0)], (0,0))








  0%|          | 0/3000 [00:00<?, ?it/s][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=185][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=185][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=185][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[A[A






  0%|          | 0/3000 [00:00<?, ?it/s, loss=184][A[A[A[A[A[

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









  0%|          | 14/3000 [00:00<00:22, 131.85it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 [00:00<00:23, 126.79it/s, loss=183][A[A[A[A[A[A[A






  1%|          | 26/3000 

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


  1%|▏         | 40/3000 [00:00<00:23, 128.50it/s, loss=182][A[A[A[A[A[A[A






  1%|▏         | 40/3000 [00:00<00:23, 128.50it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=182][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=182][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=179][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=182][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=180][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<00:22, 133.65it/s, loss=182][A[A[A[A[A[A[A






  2%|▏         | 55/3000 [00:00<

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






  2%|▏         | 66/3000 [00:00<00:24, 121.49it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 66/3000 [00:00<00:24, 121.49it/s, loss=181][A[A[A[A[A[A[A






  2%|▏         | 66/3000 [00:00<00:24, 121.49it/s, loss=181][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=181][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=180][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=181][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=180][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=181][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=180][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=181][A[A[A[A[A[A[A






  3%|▎         | 80/3000 [00:00<00:23, 124.79it/s, loss=181][A[A[A[A[A[A[A






  3%

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


  3%|▎         | 92/3000 [00:00<00:23, 122.16it/s, loss=180][A[A[A[A[A[A[A






  3%|▎         | 92/3000 [00:00<00:23, 122.16it/s, loss=178][A[A[A[A[A[A[A






  3%|▎         | 92/3000 [00:00<00:23, 122.16it/s, loss=180][A[A[A[A[A[A[A






  3%|▎         | 92/3000 [00:00<00:23, 122.16it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=179][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000 [00:00<00:22, 130.26it/s, loss=180][A[A[A[A[A[A[A






  4%|▎         | 108/3000

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









  4%|▍         | 123/3000 [00:01<00:21, 134.38it/s, loss=177][A[A[A[A[A[A[A






  4%|▍         | 123/3000 [00:01<00:21, 134.38it/s, loss=174][A[A[A[A[A[A[A






  4%|▍         | 123/3000 [00:01<00:21, 134.38it/s, loss=179][A[A[A[A[A[A[A






  4%|▍         | 123/3000 [00:01<00:21, 134.38it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=177][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=178][A[A[A[A[A[A[A






  5%|▍         | 139/3000 [00:01<00:20, 139.80it/s, loss=176][A[A[A[A[A[A[A






  5%|▍        

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=177][A[A[A[A[A[A[A






  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=177][A[A[A[A[A[A[A






  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=177][A[A[A[A[A[A[A






  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=177][A[A[A[A[A[A[A






  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=176][A[A[A[A[A[A[A






  5%|▌         | 153/3000 [00:01<00:20, 139.35it/s, loss=177][A[A[A[A[A[A[A






  6%|▌         | 167/3000 [00:01<00:21, 133.25it/s, loss=177][A[A[A[A[A[A[A






  6%|▌         | 167/3000 [00:01<00:21, 133.25it/s, loss=177][A[A[A[A[A[A[A






  6%|▌         | 167/3000 [00:01<00:21, 133.25it/s, loss=177][A[A[A[A[A[A[A






  6%|▌         | 167/3000 [00:01<00:21, 133.25it/s, loss=177][A[A[A[A[A[A[A






  6%|▌         | 167/3000 [00:01<00:21, 133.25it/s, loss=175][A[A[A[A[A[A[A






  6%|▌         | 167/

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=176][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=175][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=175][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=175][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=176][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=176][A[A[A[A[A[A[A






  6%|▌         | 181/3000 [00:01<00:21, 131.53it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 196/3000 [00:01<00:20, 134.65it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 196/3000 [00:01<00:20, 134.65it/s, loss=176][A[A[A[A[A[A[A






  7%|▋         | 196/3000 [00:01<00:20, 134.65it/s, loss=176][A[A[A[A[A[A[A






  7%|▋         | 196/3000 [00:01<00:20, 134.65it/s, loss=175][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=171][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=174][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=175][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=169][A[A[A[A[A[A[A






  7%|▋         | 211/3000 [00:01<00:20, 136.56it/s, loss=175][A[A[A[A[A[A[A






  8%|▊         | 225/3000 [00:01<00:20, 134.85it/s, loss=175][A[A[A[A[A[A[A






  8%|▊         | 225/3000 [00:01<00:20, 134.85it/s, loss=175][A[A[A[A[A[A[A






  8%|▊         | 225/3000 [00:01<00:20, 134.85it/s, loss=175][A[A[A[A[A[A[A






  8%|▊         | 225/

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=174][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=174][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 239/3000 [00:01<00:20, 135.18it/s, loss=172][A[A[A[A[A[A[A






  8%|▊         | 253/3000 [00:01<00:20, 134.43it/s, loss=172][A[A[A[A[A[A[A






  8%|▊         | 253/3000 [00:01<00:20, 134.43it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 253/3000 [00:01<00:20, 134.43it/s, loss=173][A[A[A[A[A[A[A






  8%|▊         | 253/3000 [00:01<00:20, 134.43it/s, loss=173][A[A[A[A[A[A[A






  8%|▊        

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=171][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=172][A[A[A[A[A[A[A






  9%|▉         | 267/3000 [00:02<00:20, 134.31it/s, loss=171][A[A[A[A[A[A[A






  9%|▉         | 283/3000 [00:02<00:19, 139.01it/s, loss=171][A[A[A[A[A[A[A






  9%|▉         | 283/3000 [00:02<00:19, 139.01it/s, loss=172][A[A[A[A[A[A[A






  9%|▉        

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=170][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=171][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=171][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=171][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=169][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=171][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=169][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=170][A[A[A[A[A[A[A






 10%|▉         | 297/3000 [00:02<00:19, 136.62it/s, loss=171][A[A[A[A[A[A[A






 10%|█         | 311/3000 [00:02<00:19, 135.92it/s, loss=171][A[A[A[A[A[A[A






 10%|█         | 311/3000 [00:02<00:19, 135.92it/s, loss=171][A[A[A[A[A[A[A






 10%|█        

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=170][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=169][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=170][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=170][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=169][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=170][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=170][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=169][A[A[A[A[A[A[A






 11%|█         | 325/3000 [00:02<00:19, 135.24it/s, loss=169][A[A[A[A[A[A[A






 11%|█▏        | 339/3000 [00:02<00:19, 134.06it/s, loss=169][A[A[A[A[A[A[A






 11%|█▏        | 339/3000 [00:02<00:19, 134.06it/s, loss=169][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=169][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=169][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=167][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=168][A[A[A[A[A[A[A






 12%|█▏        | 354/3000 [00:02<00:19, 137.45it/s, loss=166][A[A[A[A[A[A[A






 12%|█▏       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=166][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=166][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=167][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=167][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=167][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=166][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=166][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=166][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=167][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=167][A[A[A[A[A[A[A






 13%|█▎        | 385/3000 [00:02<00:18, 142.93it/s, loss=165][A[A[A[A[A[A[A






 13%|█▎       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=165][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=164][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=166][A[A[A[A[A[A[A






 14%|█▍        | 414/3000 [00:03<00:19, 131.89it/s, loss=165][A[A[A[A[A[A[A






 14%|█▍       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=165][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=165][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=165][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=165][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A






 15%|█▍        | 442/3000 [00:03<00:19, 133.26it/s, loss=164][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2

[A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=162][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=162][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=162][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=163][A[A[A[A[A[A[A






 16%|█▌        | 475/3000 [00:03<00:17, 145.19it/s, loss=162][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2








 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=162][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 508/3000 [00:03<00:16, 152.08it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=160][A[A[A[A[A[A[A






 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=160][A[A[A[A[A[A[A






 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=160][A[A[A[A[A[A[A






 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=161][A[A[A[A[A[A[A






 17%|█▋        | 524/3000 [00:03<00:17, 144.06it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 539/3000 [00:03<00:18, 129.53it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 539/3000 [00:03<00:18, 129.53it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 539/3000 [00:03<00:18, 129.53it/s, loss=159][A[A[A[A[A[A[A






 18%|█▊        | 539/3000 [00:03<00:18, 129.53it/s, loss=159][A[A[A[A[A[A[A






 18%|█▊        | 539/3000 [00:03<00:18, 129.53it/s, loss=159][A[A[A[A[A[A[A






 18%|█▊       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=159][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=156][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=160][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=158][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=158][A[A[A[A[A[A[A






 18%|█▊        | 553/3000 [00:04<00:20, 116.61it/s, loss=158][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 19%|█▉        | 566/3000 [00:04<00:20, 116.15it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=159][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=159][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=159][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/3000 [00:04<00:21, 115.02it/s, loss=158][A[A[A[A[A[A[A






 19%|█▉        | 578/

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 20%|█▉        | 594/3000 [00:04<00:19, 123.52it/s, loss=157][A[A[A[A[A[A[A






 20%|█▉        | 594/3000 [00:04<00:19, 123.52it/s, loss=157][A[A[A[A[A[A[A






 20%|█▉        | 594/3000 [00:04<00:19, 123.52it/s, loss=157][A[A[A[A[A[A[A






 20%|█▉        | 594/3000 [00:04<00:19, 123.52it/s, loss=157][A[A[A[A[A[A[A






 20%|█▉        | 594/3000 [00:04<00:19, 123.52it/s, loss=157][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=157][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=157][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=157][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=156][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=157][A[A[A[A[A[A[A






 20%|██        | 607/3000 [00:04<00:21, 113.09it/s, loss=157][A[A[A[A[A[A[A






 20%|██       

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=157][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=157][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=157][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 619/3000 [00:04<00:21, 112.27it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 632/3000 [00:04<00:20, 115.61it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 632/3000 [00:04<00:20, 115.61it/s, loss=156][A[A[A[A[A[A[A






 21%|██        | 632/3000 [00:04<00:20, 115.61it/s, loss=155][A[A[A[A[A[A[A






 21%|██        | 632/

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=155][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=153][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=155][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=154][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=155][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=154][A[A[A[A[A[A[A






 21%|██▏       | 644/3000 [00:04<00:20, 116.62it/s, loss=155][A[A[A[A[A[A[A






 22%|██▏       | 659/3000 [00:04<00:18, 124.94it/s, loss=155][A[A[A[A[A[A[A






 22%|██▏       | 659/3000 [00:04<00:18, 124.94it/s, loss=154][A[A[A[A[A[A[A






 22%|██▏       | 659/3000 [00:05<00:18, 124.94it/s, loss=155][A[A[A[A[A[A[A






 22%|██▏       | 659/3000 [00:05<00:18, 124.94it/s, loss=155][A[A[A[A[A[A[A






 22%|██▏      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=153][A[A[A[A[A[A[A






 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=154][A[A[A[A[A[A[A






 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=153][A[A[A[A[A[A[A






 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=153][A[A[A[A[A[A[A






 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=154][A[A[A[A[A[A[A






 22%|██▎       | 675/3000 [00:05<00:17, 132.76it/s, loss=152][A[A[A[A[A[A[A






 23%|██▎       | 689/3000 [00:05<00:18, 125.20it/s, loss=152][A[A[A[A[A[A[A






 23%|██▎       | 689/3000 [00:05<00:18, 125.20it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 689/3000 [00:05<00:18, 125.20it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 689/3000 [00:05<00:18, 125.20it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 689/3000 [00:05<00:18, 125.20it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=151][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=152][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=152][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=152][A[A[A[A[A[A[A






 23%|██▎       | 703/3000 [00:05<00:18, 125.98it/s, loss=153][A[A[A[A[A[A[A






 24%|██▍       | 716/3000 [00:05<00:17, 127.08it/s, loss=153][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=150][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=152][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=151][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=150][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=152][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=151][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=149][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=150][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=151][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=151][A[A[A[A[A[A[A






 24%|██▍       | 730/3000 [00:05<00:17, 130.06it/s, loss=151][A[A[A[A[A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=148][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=148][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=149][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=149][A[A[A[A[A[A[A






 25%|██▌       | 760/3000 [00:05<00:16, 134.86it/s, loss=150][A[A[A[A[A[A[A






 26%|██▌      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 26%|██▋       | 788/3000 [00:05<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:05<00:16, 133.11it/s, loss=148][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:05<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:05<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:05<00:16, 133.11it/s, loss=148][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=148][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=148][A[A[A[A[A[A[A






 26%|██▋       | 788/3000 [00:06<00:16, 133.11it/s, loss=149][A[A[A[A[A[A[A






 26%|██▋      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=148][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=148][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=148][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=146][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=146][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋       | 819/3000 [00:06<00:15, 142.41it/s, loss=147][A[A[A[A[A[A[A






 27%|██▋      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 28%|██▊       | 834/3000 [00:06<00:16, 128.94it/s, loss=145][A[A[A[A[A[A[A






 28%|██▊       | 834/3000 [00:06<00:16, 128.94it/s, loss=146][A[A[A[A[A[A[A






 28%|██▊       | 834/3000 [00:06<00:16, 128.94it/s, loss=146][A[A[A[A[A[A[A






 28%|██▊       | 834/3000 [00:06<00:16, 128.94it/s, loss=147][A[A[A[A[A[A[A






 28%|██▊       | 834/3000 [00:06<00:16, 128.94it/s, loss=147][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=147][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=146][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=146][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=146][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=145][A[A[A[A[A[A[A






 28%|██▊       | 850/3000 [00:06<00:16, 133.07it/s, loss=143][A[A[A[A[A[A[A






 28%|██▊      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=144][A[A[A[A[A[A[A






 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=144][A[A[A[A[A[A[A






 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 865/3000 [00:06<00:15, 136.04it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 881/3000 [00:06<00:15, 141.10it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 881/3000 [00:06<00:15, 141.10it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 881/3000 [00:06<00:15, 141.10it/s, loss=145][A[A[A[A[A[A[A






 29%|██▉       | 881/3000 [00:06<00:15, 141.10it/s, loss=144][A[A[A[A[A[A[A






 29%|██▉       | 881/3000 [00:06<00:15, 141.10it/s, loss=144][A[A[A[A[A[A[A






 29%|██▉      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=144][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=144][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=144][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=144][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=142][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=144][A[A[A[A[A[A[A






 30%|██▉       | 896/3000 [00:06<00:15, 139.66it/s, loss=143][A[A[A[A[A[A[A






 30%|███       | 911/3000 [00:06<00:14, 139.97it/s, loss=143][A[A[A[A[A[A[A






 30%|███       | 911/3000 [00:06<00:14, 139.97it/s, loss=144][A[A[A[A[A[A[A






 30%|███       | 911/3000 [00:06<00:14, 139.97it/s, loss=143][A[A[A[A[A[A[A






 30%|███       | 911/3000 [00:06<00:14, 139.97it/s, loss=144][A[A[A[A[A[A[A






 30%|███      

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 31%|███       | 926/3000 [00:06<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=141][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=143][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=142][A[A[A[A[A[A[A






 31%|███       | 926/3000 [00:07<00:15, 138.15it/s, loss=141][A[A[A[A[A[A[A






 31%|███▏      | 942/3000 [00:07<00:14, 143.35it/s, loss=141][A[A[A[A[A[A[A






 31%|███▏     

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=139][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 959/3000 [00:07<00:13, 147.18it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏      | 974/3000 [00:07<00:13, 146.84it/s, loss=141][A[A[A[A[A[A[A






 32%|███▏     

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 32%|███▏      | 974/3000 [00:07<00:13, 146.84it/s, loss=139][A[A[A[A[A[A[A






 32%|███▏      | 974/3000 [00:07<00:13, 146.84it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=138][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎      | 989/3000 [00:07<00:15, 129.28it/s, loss=140][A[A[A[A[A[A[A






 33%|███▎     

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 33%|███▎      | 1003/3000 [00:07<00:15, 128.82it/s, loss=139][A[A[A[A[A[A[A






 33%|███▎      | 1003/3000 [00:07<00:15, 128.82it/s, loss=139][A[A[A[A[A[A[A






 33%|███▎      | 1003/3000 [00:07<00:15, 128.82it/s, loss=139][A[A[A[A[A[A[A






 33%|███▎      | 1003/3000 [00:07<00:15, 128.82it/s, loss=137][A[A[A[A[A[A[A






 33%|███▎      | 1003/3000 [00:07<00:15, 128.82it/s, loss=139][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=139][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=139][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=139][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=139][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=136][A[A[A[A[A[A[A






 34%|███▍      | 1017/3000 [00:07<00:16, 123.67it/s, loss=139][A[A[A[A[A[A[A






 34

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=137][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=137][A[A[A[A[A[A[A






 34%|███▍      | 1030/3000 [00:07<00:16, 122.36it/s, loss=138][A[A[A[A[A[A[A






 35%|███▍      | 1045/3000 [00:07<00:15, 129.01it/s, loss=138][A[A[A[A[A[A[A






 35%|███▍      | 1045/3000 [00:07<00:15, 129.01it/s, loss=136][A[A[A[A[A[A[A






 35%|███▍      | 1045/3000 [00:07<00:15, 129.01it/s, loss=137][A[A[A[A[A[A[A






 35

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=136][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=137][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=137][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=137][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=136][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=137][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=137][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=136][A[A[A[A[A[A[A






 35%|███▌      | 1059/3000 [00:08<00:14, 129.89it/s, loss=136][A[A[A[A[A[A[A






 36%|███▌      | 1073/3000 [00:08<00:15, 124.47it/s, loss=136][A[A[A[A[A[A[A






 36%|███▌      | 1073/3000 [00:08<00:15, 124.47it/s, loss=136][A[A[A[A[A[A[A






 36

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=134][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 36%|███▌      | 1086/3000 [00:08<00:15, 124.80it/s, loss=135][A[A[A[A[A[A[A






 37%|███▋      | 1099/3000 [00:08<00:15, 125.23it/s, loss=135][A[A[A[A[A[A[A






 37%|███▋      | 1099/3000 [00:08<00:15, 125.23it/s, loss=135][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=133][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=132][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=132][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=132][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37%|███▋      | 1113/3000 [00:08<00:14, 127.75it/s, loss=134][A[A[A[A[A[A[A






 37

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=133][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=133][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=133][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=132][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=131][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=133][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=132][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=132][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=131][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=133][A[A[A[A[A[A[A






 38%|███▊      | 1144/3000 [00:08<00:13, 137.42it/s, loss=132][A[A[A[A[A[A[A






 38

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=132][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=132][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=132][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=129][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=129][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39%|███▉      | 1174/3000 [00:08<00:13, 138.95it/s, loss=131][A[A[A[A[A[A[A






 39

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40%|████      | 1204/3000 [00:09<00:12, 141.38it/s, loss=130][A[A[A[A[A[A[A






 40

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 41%|████      | 1219/3000 [00:09<00:12, 142.10it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1219/3000 [00:09<00:12, 142.10it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1219/3000 [00:09<00:12, 142.10it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=128][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=129][A[A[A[A[A[A[A






 41%|████      | 1234/3000 [00:09<00:13, 129.82it/s, loss=128][A[A[A[A[A[A[A






 41%|████ 

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 42%|████▏     | 1249/3000 [00:09<00:13, 133.44it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1249/3000 [00:09<00:13, 133.44it/s, loss=126][A[A[A[A[A[A[A






 42%|████▏     | 1249/3000 [00:09<00:13, 133.44it/s, loss=127][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=127][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=128][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=127][A[A[A[A[A[A[A






 42%|████▏     | 1264/3000 [00:09<00:12, 136.56it/s, loss=127][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 43%|████▎     | 1278/3000 [00:09<00:12, 136.08it/s, loss=127][A[A[A[A[A[A[A






 43%|████▎     | 1278/3000 [00:09<00:12, 136.08it/s, loss=127][A[A[A[A[A[A[A






 43%|████▎     | 1278/3000 [00:09<00:12, 136.08it/s, loss=127][A[A[A[A[A[A[A






 43%|████▎     | 1278/3000 [00:09<00:12, 136.08it/s, loss=126][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=126][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=127][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=124][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=126][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=126][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=126][A[A[A[A[A[A[A






 43%|████▎     | 1292/3000 [00:09<00:13, 131.01it/s, loss=126][A[A[A[A[A[A[A






 43

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=126][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=125][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=125][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=126][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=126][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=125][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=124][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=124][A[A[A[A[A[A[A






 44%|████▎     | 1306/3000 [00:09<00:13, 122.14it/s, loss=125][A[A[A[A[A[A[A






 44%|████▍     | 1319/3000 [00:09<00:13, 124.18it/s, loss=125][A[A[A[A[A[A[A






 44%|████▍     | 1319/3000 [00:09<00:13, 124.18it/s, loss=125][A[A[A[A[A[A[A






 44

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=125][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=125][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=123][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 44%|████▍     | 1332/3000 [00:10<00:13, 122.99it/s, loss=124][A[A[A[A[A[A[A






 45%|████▍     | 1346/3000 [00:10<00:13, 127.00it/s, loss=124][A[A[A[A[A[A[A






 45

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 45%|████▍     | 1346/3000 [00:10<00:13, 127.00it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=122][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=121][A[A[A[A[A[A[A






 45%|████▌     | 1359/3000 [00:10<00:14, 114.50it/s, loss=123][A[A[A[A[A[A[A






 45%|████▌

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 46%|████▌     | 1371/3000 [00:10<00:14, 108.69it/s, loss=121][A[A[A[A[A[A[A






 46%|████▌     | 1371/3000 [00:10<00:14, 108.69it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1371/3000 [00:10<00:14, 108.69it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1371/3000 [00:10<00:14, 108.69it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1371/3000 [00:10<00:14, 108.69it/s, loss=120][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=120][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌     | 1383/3000 [00:10<00:15, 104.31it/s, loss=122][A[A[A[A[A[A[A






 46%|████▌

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 47%|████▋     | 1398/3000 [00:10<00:14, 114.34it/s, loss=120][A[A[A[A[A[A[A






 47%|████▋     | 1398/3000 [00:10<00:14, 114.34it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1398/3000 [00:10<00:14, 114.34it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1398/3000 [00:10<00:14, 114.34it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1398/3000 [00:10<00:14, 114.34it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=120][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=120][A[A[A[A[A[A[A






 47%|████▋     | 1414/3000 [00:10<00:12, 123.27it/s, loss=121][A[A[A[A[A[A[A






 47%|████▋

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=118][A[A[A[A[A[A[A






 48%|████▊     | 1427/3000 [00:10<00:13, 118.85it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1440/3000 [00:10<00:14, 108.09it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊     | 1440/3000 [00:11<00:14, 108.09it/s, loss=120][A[A[A[A[A[A[A






 48%|████▊

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=118][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=118][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=118][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=117][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=119][A[A[A[A[A[A[A






 48%|████▊     | 1453/3000 [00:11<00:13, 112.17it/s, loss=118][A[A[A[A[A[A[A






 48

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 49%|████▉     | 1467/3000 [00:11<00:13, 114.83it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1467/3000 [00:11<00:13, 114.83it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=118][A[A[A[A[A[A[A






 49%|████▉     | 1479/3000 [00:11<00:13, 109.46it/s, loss=117][A[A[A[A[A[A[A






 49

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 50%|████▉     | 1491/3000 [00:11<00:13, 112.30it/s, loss=117][A[A[A[A[A[A[A






 50%|████▉     | 1491/3000 [00:11<00:13, 112.30it/s, loss=117][A[A[A[A[A[A[A






 50%|████▉     | 1491/3000 [00:11<00:13, 112.30it/s, loss=115][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=115][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=117][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=114][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=117][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=116][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=117][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=117][A[A[A[A[A[A[A






 50%|█████     | 1503/3000 [00:11<00:13, 112.32it/s, loss=117][A[A[A[A[A[A[A






 50

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 51%|█████     | 1516/3000 [00:11<00:12, 116.49it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1516/3000 [00:11<00:12, 116.49it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1516/3000 [00:11<00:12, 116.49it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=115][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=115][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=115][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=116][A[A[A[A[A[A[A






 51%|█████     | 1529/3000 [00:11<00:12, 117.87it/s, loss=116][A[A[A[A[A[A[A






 51

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=115][A[A[A[A[A[A[A






 51%|█████▏    | 1541/3000 [00:11<00:13, 111.16it/s, loss=110][A[A[A[A[A[A[A






 52%|█████▏    | 1553/3000 [00:11<00:13, 107.45it/s, loss=110][A[A[A[A[A[A[A






 52%|█████▏    | 1553/3000 [00:12<00:13, 107.45it/s, loss=115][A[A[A[A[A[A[A






 52%|█████▏    | 1553/3000 [00:12<00:13, 107.45it/s, loss=115][A[A[A[A[A[A[A






 52%|█████▏    | 1553/3000 [00:12<00:13, 107.45it/s, loss=115][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=114][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=114][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=114][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=113][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=113][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=113][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=110][A[A[A[A[A[A[A






 52%|█████▏    | 1569/3000 [00:12<00:12, 117.88it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=114][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1582/3000 [00:12<00:12, 112.32it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=111][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=109][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=113][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=111][A[A[A[A[A[A[A






 53%|█████▎    | 1594/3000 [00:12<00:13, 101.89it/s, loss=113][A[A[A[A[A[A[A






 53

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 54%|█████▎    | 1607/3000 [00:12<00:12, 108.90it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▎    | 1607/3000 [00:12<00:12, 108.90it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▎    | 1607/3000 [00:12<00:12, 108.90it/s, loss=110][A[A[A[A[A[A[A






 54%|█████▎    | 1607/3000 [00:12<00:12, 108.90it/s, loss=111][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=111][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=111][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=112][A[A[A[A[A[A[A






 54%|█████▍    | 1622/3000 [00:12<00:11, 118.43it/s, loss=111][A[A[A[A[A[A[A






 54

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 55%|█████▍    | 1636/3000 [00:12<00:11, 123.93it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▍    | 1636/3000 [00:12<00:11, 123.93it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▍    | 1636/3000 [00:12<00:11, 123.93it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▍    | 1636/3000 [00:12<00:11, 123.93it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55%|█████▌    | 1650/3000 [00:12<00:10, 125.67it/s, loss=110][A[A[A[A[A[A[A






 55

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 55%|█████▌    | 1664/3000 [00:12<00:10, 128.07it/s, loss=109][A[A[A[A[A[A[A






 55%|█████▌    | 1664/3000 [00:12<00:10, 128.07it/s, loss=109][A[A[A[A[A[A[A






 55%|█████▌    | 1664/3000 [00:12<00:10, 128.07it/s, loss=109][A[A[A[A[A[A[A






 55%|█████▌    | 1664/3000 [00:12<00:10, 128.07it/s, loss=106][A[A[A[A[A[A[A






 55%|█████▌    | 1664/3000 [00:12<00:10, 128.07it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:12<00:10, 128.96it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:13<00:10, 128.96it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:13<00:10, 128.96it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:13<00:10, 128.96it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:13<00:10, 128.96it/s, loss=109][A[A[A[A[A[A[A






 56%|█████▌    | 1678/3000 [00:13<00:10, 128.96it/s, loss=109][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=108][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=107][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=107][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=105][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=108][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=108][A[A[A[A[A[A[A






 56%|█████▋    | 1694/3000 [00:13<00:09, 135.89it/s, loss=106][A[A[A[A[A[A[A






 57%|█████▋    | 1710/3000 [00:13<00:09, 140.51it/s, loss=106][A[A[A[A[A[A[A






 57%|█████▋    | 1710/3000 [00:13<00:09, 140.51it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▋    | 1710/3000 [00:13<00:09, 140.51it/s, loss=108][A[A[A[A[A[A[A






 57%|█████▋    | 1710/3000 [00:13<00:09, 140.51it/s, loss=107][A[A[A[A[A[A[A






 57

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=106][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=106][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=104][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=106][A[A[A[A[A[A[A






 57%|█████▊    | 1725/3000 [00:13<00:09, 132.41it/s, loss=107][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 58%|█████▊    | 1739/3000 [00:13<00:10, 124.35it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=105][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=105][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=105][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=106][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=105][A[A[A[A[A[A[A






 58%|█████▊    | 1752/3000 [00:13<00:10, 118.40it/s, loss=104][A[A[A[A[A[A[A






 58

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2

 59%|█████▉    | 1768/3000 [00:13<00:09, 128.22it/s, loss=104][A[A[A[A[A[A[A






 59%|█████▉    | 1768/3000 [00:13<00:09, 128.22it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████▉    | 1785/3000 [00:13<00:08, 136.57it/s, loss=104][A[A[A[A[A[A[A






 60%|█████

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 60%|██████    | 1801/3000 [00:13<00:08, 141.53it/s, loss=103][A[A[A[A[A[A[A






 60%|██████    | 1801/3000 [00:13<00:08, 141.53it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:13<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=103][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=100][A[A[A[A[A[A[A






 61%|██████    | 1818/3000 [00:14<00:08, 147.13it/s, loss=102][A[A[A

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=101][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=99.2][A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102] [A[A[A[A[A[A[A






 61%|██████    | 1834/3000 [00:14<00:09, 124.61it/s, loss=102][A[A[

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


[A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=101][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=101][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=99.3][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100] [A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[A[A[A[A[A






 62%|██████▏   | 1865/3000 [00:14<00:08, 136.66it/s, loss=100][A[A[

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99.4][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99.4][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=98.9][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99.3][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=98.6][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99.2][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99.1][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99]  [A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=98.7][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=98.9][A[A[A[A[A[A[A






 63%|██████▎   | 1895/3000 [00:14<00:08, 137.98it/s, loss=99]  [A[A[A[A[A[A[A







tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 64%|██████▎   | 1910/3000 [00:14<00:07, 140.50it/s, loss=96.8][A[A[A[A[A[A[A






 64%|██████▎   | 1910/3000 [00:14<00:07, 140.50it/s, loss=95.8][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=95.8][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=98]  [A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=96.5][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=98]  [A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=97.8][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=97.7][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=97.6][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=97.7][A[A[A[A[A[A[A






 64%|██████▍   | 1925/3000 [00:14<00:08, 130.17it/s, loss=97.6][A[A[A[A[A[A[

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)









 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=97.2][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=97.1][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=97.3][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=96.8][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=96]  [A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=96.6][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=92.9][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=96.4][A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=97]  [A[A[A[A[A[A[A






 65%|██████▍   | 1939/3000 [00:15<00:08, 118.45it/s, loss=95.2][A[A[A[A[A[A[A






 65%|██████▌   | 1952/3000 [00:15<00:09, 106.58it/s, loss=95.2][A[A[A[A[A[A[

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)


 65%|██████▌   | 1952/3000 [00:15<00:09, 106.58it/s, loss=96]  [A[A[A[A[A[A[A






 65%|██████▌   | 1952/3000 [00:15<00:09, 106.58it/s, loss=96.4][A[A[A[A[A[A[A






 65%|██████▌   | 1952/3000 [00:15<00:09, 106.58it/s, loss=95.1][A[A[A[A[A[A[A






 65%|██████▌   | 1952/3000 [00:15<00:09, 106.58it/s, loss=95.6][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=95.6][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=96.4][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=95.9][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=95]  [A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=96][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=96][A[A[A[A[A[A[A






 65%|██████▌   | 1964/3000 [00:15<00:09, 105.89it/s, loss=96.1][A[A[A[A[A[A[A






 65

tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(2., requires_grad=True)
tensor(nan, requires_grad=True)


ValueError: The parameter loc has invalid values
Trace Shapes:
 Param Sites:
   mean(0, 0)
  scale(0, 0)
Sample Sites:








 65%|██████▌   | 1964/3000 [00:34<00:09, 105.89it/s, loss=nan][A[A[A[A[A[A[A

In [10]:
divided_data = div_by_category(X_train, Y_train)

adam_params = {"lr": 0.5}
optimizer = pyro.optim.Adam(adam_params)
svi = SVI(model, guide, optimizer, loss=Trace_ELBO())

n_steps = 2501
for step in range(n_steps):
    svi.step(divided_data[(2, 2)], (2,2))
    if step % 100 == 0:
        print_progress()


ValueError: Error while computing log_prob at site 'prob(2, 2)':
The value argument to log_prob must be a Tensor
  Trace Shapes:     
   Param Sites:     
  Sample Sites:     
prob(2, 2) dist 33 |
          value 33 |

In [None]:
pyro.clear_param_store()
type("ad")

In [None]:
for i in range(1, 10):
    print(pyro.sample('test', dist.Normal(torch.zeros(1, 1), 1.).independent(1)))

In [None]:
for i in range(1, 10):
    print(pyro.sample('test', dist.Normal(torch.zeros(1, 1), 1.).to_event(1)))