In [27]:
# Import dependency 
import numpy as np 
import torch 
import torch.optim as optim
import torch.nn as nn 

In [28]:
# Data generation 
true_b = 1
true_w = 2 
N = 100

# set the random seed for numpy 
np.random.seed(43)

x= np.random.rand(N,1)
epsilon = (.1 * np.random.rand(N,1))

y = true_b + true_w *x + epsilon

In [29]:
#Generate training and validating sets
idx = np.arange(N)

# Use first 80 random indices for train 
train_idx = idx[:int(N*.8)]
val_idx = idx[int(N*.8):]

# Generate train and validation sets
x_train, y_train = x[train_idx], y[train_idx]


In [30]:
# Data preparation 

device = 'cuda' if torch.cuda.is_available() else 'cpu'

# Transform data from numpy array to torch tensor
x_train_tensor = torch.as_tensor(x_train).float().to(device)
y_train_tensor = torch.as_tensor(y_train).float().to(device)

In [31]:
# Build a Dataset
from torch.utils.data import Dataset

class CustomDataset(Dataset):
    def __init__(self, x_tensor, y_tensor):
        self.x = x_tensor
        self.y = y_tensor
    
    def __getitem__(self, index):
        return (self.x[index], self.y[index])
    
    def __len__(self):
        return len(self.x)

train_data = CustomDataset(x_train_tensor, y_train_tensor)
print(train_data[0])
print(len(train_data))

(tensor([0.1151]), tensor([1.2404]))
80


In [32]:
from torch.utils.data import DataLoader

# Build a data loader that yields mini-batches of size 2
train_loader = DataLoader(
        dataset=train_data,
        batch_size=2,
        shuffle=True
)
print(train_loader)

<torch.utils.data.dataloader.DataLoader object at 0x7f97f0bc4190>


In [33]:
print(next(iter(train_loader)))

[tensor([[0.6701],
        [0.2544]]), tensor([[2.4077],
        [1.6011]])]


In [34]:
#Define the train step

def make_train_step(model, loss_fn, optimizer):
    # Builds function that performs a step in the train loop 
    def perform_train_step(x,y):
        
        # Set the model to TRAIN mode
        model.train()
        
        # Step1: Compute the model's predicition - forward pass
        yhat = model(x)
        
        # Step2: Compute the loss
        loss = loss_fn(yhat, y)
        
        # Step3: Compute gradients for "b" and "w" parameters
        loss.backward()
        
        # Step4: Updates parameters using gradients and the learning rate
        optimizer.step()
        optimizer.zero_grad()
        
        #print(model.state_dict())
        # Return the loss 
        return loss.item()
    #Return the function that will be called inside the train loop
    return perform_train_step

In [35]:
# Model config 

# Define the model 
class ManualLinearRegression(nn.Module):
    def __init__(self):
        super().__init__()
        self.linear = nn.Linear(1,1)
    def forward(self,x):
        return self.linear(x)


# Set learning rate 
lr = 0.1

torch.manual_seed(42)

# Create a model and send it to the device 
model = ManualLinearRegression().to(device)
print(model.state_dict())

# Define a SGD optimizer to update the parameters 
optimizer = torch.optim.SGD(model.parameters(), lr=lr)

# Define a MSE loss function 
loss_fn = nn.MSELoss(reduction="mean")


# Create a train_step 
train_step = make_train_step(model, loss_fn, optimizer)

OrderedDict([('linear.weight', tensor([[0.7645]])), ('linear.bias', tensor([0.8300]))])


In [36]:
# Model training

n_epochs = 1000
losses = []
for epoch in range(n_epochs):
    
    # Add the inner loop to fetch the data
    mini_batch_losses = []
    for x_batch, y_batch in train_loader:
        #The dataset "lives" in the CPU, so do our mini-batches
        # we need send to mini-batches to the device 
        x_batch = x_batch.to(device)
        y_batch = y_batch.to(device)
        
        # Performs one train step and returns the corresonding loss 
        mini_batch_loss = train_step(x_batch, y_batch)
        mini_batch_losses.append(mini_batch_loss)
        
        
    # Compute average loss over all mini-batches
    loss = np.mean(mini_batch_loss)
    losses.append(loss)
   

OrderedDict([('linear.weight', tensor([[0.9270]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', tensor([[0.9615]])), ('linear.bias', tensor([1.1255]))])
OrderedDict([('linear.weight', tensor([[1.0181]])), ('linear.bias', tensor([1.2145]))])
OrderedDict([('linear.weight', tensor([[1.0480]])), ('linear.bias', tensor([1.2750]))])
OrderedDict([('linear.weight', tensor([[1.1444]])), ('linear.bias', tensor([1.3914]))])
OrderedDict([('linear.weight', tensor([[1.1813]])), ('linear.bias', tensor([1.4218]))])
OrderedDict([('linear.weight', tensor([[1.1819]])), ('linear.bias', tensor([1.4188]))])
OrderedDict([('linear.weight', tensor([[1.2366]])), ('linear.bias', tensor([1.4812]))])
OrderedDict([('linear.weight', tensor([[1.2485]])), ('linear.bias', tensor([1.4505]))])
OrderedDict([('linear.weight', tensor([[1.2436]])), ('linear.bias', tensor([1.3844]))])
OrderedDict([('linear.weight', tensor([[1.2379]])), ('linear.bias', tensor([1.3640]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9659]])), ('linear.bias', tensor([1.0718]))])
OrderedDict([('linear.weight', tensor([[1.9689]])), ('linear.bias', tensor([1.0739]))])
OrderedDict([('linear.weight', tensor([[1.9681]])), ('linear.bias', tensor([1.0715]))])
OrderedDict([('linear.weight', tensor([[1.9714]])), ('linear.bias', tensor([1.0785]))])
OrderedDict([('linear.weight', tensor([[1.9691]])), ('linear.bias', tensor([1.0685]))])
OrderedDict([('linear.weight', tensor([[1.9671]])), ('linear.bias', tensor([1.0621]))])
OrderedDict([('linear.weight', tensor([[1.9684]])), ('linear.bias', tensor([1.0639]))])
OrderedDict([('linear.weight', tensor([[1.9668]])), ('linear.bias', tensor([1.0613]))])
OrderedDict([('linear.weight', tensor([[1.9693]])), ('linear.bias', tensor([1.0666]))])
OrderedDict([('linear.weight', tensor([[1.9672]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[1.9653]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0529]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0055]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0052]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0427]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', tensor([[2.0090]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[2.0073]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[2.0049]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0433]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0048]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0531]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[2.0068]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0579]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0400]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0454]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0398]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0422]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0439]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0427]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0418]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0395]))])
OrderedDict([('linear.weight', tensor([[2.0054]])), ('linear.bias', tensor([1.0459]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0370]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0617]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0615]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0396]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0601]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0460]))])
OrderedDict([('linear.weight', tensor([[1.9922]])), ('linear.bias', tensor([1.0415]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0080]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0569]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0612]))])
OrderedDict([('linear.weight', tensor([[2.0039]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0590]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0605]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0092]])), ('linear.bias', tensor([1.0648]))])
OrderedDict([('linear.weight', tensor([[2.0067]])), ('linear.bias', tensor([1.0651]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0599]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0641]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0663]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0648]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0590]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0630]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0586]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0612]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0592]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0650]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0612]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0592]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0492]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0448]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0483]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0420]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0649]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0586]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0450]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0444]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0473]))])
OrderedDict([('linear.weight', tensor([[1.9941]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0404]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0397]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0358]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0353]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[2.0054]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0439]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0415]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0442]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0386]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0433]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0059]])), ('linear.bias', tensor([1.0605]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0404]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0433]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[1.9926]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9926]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0624]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0615]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0578]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0531]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0579]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9920]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9928]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0398]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0408]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0336]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0389]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0407]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0393]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0409]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0396]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0396]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0377]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0380]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[2.0058]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0410]))])
OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9900]])), ('linear.bias', tensor([1.0346]))])
OrderedDict([('linear.weight', tensor([[1.9906]])), ('linear.bias', tensor([1.0410]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0658]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0631]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0483]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0578]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0600]))])
OrderedDict([('linear.weight', tensor([[2.0049]])), ('linear.bias', tensor([1.0627]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0436]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9951]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0406]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[2.0039]])), ('linear.bias', tensor([1.0611]))])
OrderedDict([('linear.weight', tensor([[2.0063]])), ('linear.bias', tensor([1.0640]))])
OrderedDict([('linear.weight', tensor([[2.0057]])), ('linear.bias', tensor([1.0633]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0440]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0651]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0615]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0605]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0584]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0559]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0410]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0462]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0531]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0403]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0092]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[2.0071]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[2.0056]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0459]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0057]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[2.0060]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0462]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0407]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0342]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0529]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9927]])), ('linear.bias', tensor([1.0397]))])
OrderedDict([('linear.weight', tensor([[1.9918]])), ('linear.bias', tensor([1.0381]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0447]))])
OrderedDict([('linear.weight', tensor([[2.0066]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0405]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0433]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0502]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0631]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0606]))])
OrderedDict([('linear.weight', tensor([[2.0069]])), ('linear.bias', tensor([1.0673]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[1.9933]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[1.9917]])), ('linear.bias', tensor([1.0385]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0569]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0617]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0621]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0617]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0654]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[1.9899]])), ('linear.bias', tensor([1.0422]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0577]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0636]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[1.9903]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9933]])), ('linear.bias', tensor([1.0483]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0072]])), ('linear.bias', tensor([1.0624]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[2.0060]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0549]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0604]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0578]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0413]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9941]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9922]])), ('linear.bias', tensor([1.0454]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0502]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0577]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0588]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0427]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[2.0068]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0052]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0058]])), ('linear.bias', tensor([1.0577]))])
OrderedDict([('linear.weight', tensor([[2.0051]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[2.0048]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0549]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0632]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0622]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0655]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0686]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0597]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9935]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0630]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[1.9933]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9918]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0352]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0447]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0502]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9941]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9936]])), ('linear.bias', tensor([1.0453]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0437]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0450]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0605]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0453]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0421]))])
OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0376]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0421]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0634]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0579]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0624]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0385]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0411]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0473]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9929]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9941]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0578]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[2.0052]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0597]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0587]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0618]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0437]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0460]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0437]))])
OrderedDict([('linear.weight', tensor([[2.0094]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', tensor([[2.0069]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[2.0064]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[2.0089]])), ('linear.bias', tensor([1.0600]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0093]])), ('linear.bias', tensor([1.0708]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[1.9927]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9897]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[1.9907]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9903]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9892]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9902]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0069]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0072]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[2.0085]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[2.0108]])), ('linear.bias', tensor([1.0605]))])
OrderedDict([('linear.weight', tensor([[2.0110]])), ('linear.bias', tensor([1.0572]))])
OrderedDict([('linear.weight', tensor([[2.0101]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0070]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[2.0051]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0403]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[1.9907]])), ('linear.bias', tensor([1.0394]))])
OrderedDict([('linear.weight', tensor([[1.9902]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9906]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[1.9926]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0600]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0529]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9929]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9899]])), ('linear.bias', tensor([1.0411]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0623]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0596]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0662]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0619]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9908]])), ('linear.bias', tensor([1.0387]))])
OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0424]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9941]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0442]))])
OrderedDict([('linear.weight', tensor([[1.9905]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9921]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0610]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0632]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0653]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0656]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0586]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9923]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[1.9919]])), ('linear.bias', tensor([1.0440]))])
OrderedDict([('linear.weight', tensor([[1.9914]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0483]))])
OrderedDict([('linear.weight', tensor([[1.9951]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9951]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0633]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0616]))])
OrderedDict([('linear.weight', tensor([[1.9918]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9887]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9869]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', tensor([[1.9915]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9928]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0408]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0447]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0492]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0502]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0389]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0436]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0459]))])
OrderedDict([('linear.weight', tensor([[2.0063]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0085]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0082]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0559]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0615]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0100]])), ('linear.bias', tensor([1.0643]))])
OrderedDict([('linear.weight', tensor([[2.0073]])), ('linear.bias', tensor([1.0599]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0058]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0073]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[2.0039]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[2.0059]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0579]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0588]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[2.0058]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0003]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0447]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0092]])), ('linear.bias', tensor([1.0639]))])
OrderedDict([('linear.weight', tensor([[2.0073]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[2.0072]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[2.0087]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0444]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0439]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[1.9915]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9904]])), ('linear.bias', tensor([1.0448]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0444]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0609]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0616]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0592]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0422]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0406]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[2.0064]])), ('linear.bias', tensor([1.0586]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[2.0048]])), ('linear.bias', tensor([1.0601]))])
OrderedDict([('linear.weight', tensor([[2.0068]])), ('linear.bias', tensor([1.0667]))])
OrderedDict([('linear.weight', tensor([[2.0060]])), ('linear.bias', tensor([1.0614]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0053]])), ('linear.bias', tensor([1.0470]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0411]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0400]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0404]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0354]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0379]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0360]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0389]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[1.9923]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0607]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0590]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0601]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9921]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0580]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0623]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0529]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0607]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0625]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[1.9910]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9921]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9884]])), ('linear.bias', tensor([1.0435]))])
OrderedDict([('linear.weight', tensor([[1.9869]])), ('linear.bias', tensor([1.0400]))])
OrderedDict([('linear.weight', tensor([[1.9904]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0067]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0451]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0637]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0623]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0632]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[2.]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0617]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tenso

OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0405]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0104]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[2.0084]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0076]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0081]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0062]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0078]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0078]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[2.0070]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0409]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0404]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0362]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0380]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0394]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0470]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[2.0059]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0062]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[1.9903]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9887]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[1.9860]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[1.9849]])), ('linear.bias', tensor([1.0438]))])
OrderedDict([('linear.weight', tensor([[1.9872]])), ('linear.bias', tensor([1.0454]))])
OrderedDict([('linear.weight', tensor([[1.9895]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0643]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0597]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0645]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0559]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9929]])), ('linear.bias', tensor([1.0435]))])
OrderedDict([('linear.weight', tensor([[1.9936]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0418]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0370]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0370]))])
OrderedDict([('linear.weight', tensor([[1.9947]])), ('linear.bias', tensor([1.0406]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0453]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[2.0070]])), ('linear.bias', tensor([1.0671]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0492]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0448]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0462]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0380]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0427]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0531]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9888]])), ('linear.bias', tensor([1.0362]))])
OrderedDict([('linear.weight', tensor([[1.9898]])), ('linear.bias', tensor([1.0374]))])
OrderedDict([('linear.weight', tensor([[1.9901]])), ('linear.bias', tensor([1.0381]))])
OrderedDict([('linear.weight', tensor([[1.9914]])), ('linear.bias', tensor([1.0407]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0429]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0386]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0391]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0373]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0351]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0436]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0626]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0616]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0592]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[1.9996]])), ('linear.bias', tensor([1.0622]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0436]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0361]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0419]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0350]))])
OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0417]))])
OrderedDict([('linear.weight', tensor([[2.0069]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[2.0078]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[2.0127]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0442]))])
OrderedDict([('linear.weight', tensor([[2.0051]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0382]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0344]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0399]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0039]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0588]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[1.9951]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[1.9936]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[1.9911]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[1.9916]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0621]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9912]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9934]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0397]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0470]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0537]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[2.0048]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0436]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0428]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0482]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0401]))])
OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0353]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[2.0080]])), ('linear.bias', tensor([1.0549]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0069]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0462]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[2.0048]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0431]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[2.0088]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0066]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[2.0064]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0052]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[2.0078]])), ('linear.bias', tensor([1.0554]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[2.0051]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0576]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0625]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0527]))])
OrderedDict([('linear.weight', tensor([[2.0047]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[2.0044]])), ('linear.bias', tensor([1.0596]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0424]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0473]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0473]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9949]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0470]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0572]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0600]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9924]])), ('linear.bias', tensor([1.0442]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0612]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0649]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0652]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0665]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0018]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0648]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0602]))])
OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0479]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0453]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0462]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9917]])), ('linear.bias', tensor([1.0386]))])
OrderedDict([('linear.weight', tensor([[1.9928]])), ('linear.bias', tensor([1.0405]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0406]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0349]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0409]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0373]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0386]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0426]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[2.0026]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0510]))])
OrderedDict([('linear.weight', tensor([[2.0050]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0525]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0529]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0541]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0364]))])
OrderedDict([('linear.weight', tensor([[1.9918]])), ('linear.bias', tensor([1.0387]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0433]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[2.0066]])), ('linear.bias', tensor([1.0617]))])
OrderedDict([('linear.weight', tensor([[2.0090]])), ('linear.bias', tensor([1.0654]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0583]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0430]))])
OrderedDict([('linear.weight', tensor([[1.9939]])), ('linear.bias', tensor([1.0377]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0060]])), ('linear.bias', tensor([1.0565]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0489]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[2.0001]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0622]))])
OrderedDict([('linear.weight', tensor([[1.9976]])), ('linear.bias', tensor([1.0607]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0640]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0556]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0613]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0607]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0501]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0558]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', tensor([[1.9963]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0400]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0448]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0412]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9936]])), ('linear.bias', tensor([1.0460]))])
OrderedDict([('linear.weight', tensor([[1.9935]])), ('linear.bias', tensor([1.0460]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0074]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[2.0076]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[2.0065]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0444]))])
OrderedDict([('linear.weight', tensor([[2.0027]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0465]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0435]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0475]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9980]])), ('linear.bias', tensor([1.0493]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0486]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[1.9948]])), ('linear.bias', tensor([1.0524]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0058]])), ('linear.bias', tensor([1.0634]))])
OrderedDict([('linear.weight', tensor([[2.0057]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0070]])), ('linear.bias', tensor([1.0584]))])
OrderedDict([('linear.weight', tensor([[2.0039]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', tensor([[2.0036]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[2.0016]])), ('linear.bias', tensor([1.0499]))])
OrderedDict([('linear.weight', tensor([[2.0057]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9994]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0557]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9916]])), ('linear.bias', tensor([1.0426]))])
OrderedDict([('linear.weight', tensor([[1.9925]])), ('linear.bias', tensor([1.0424]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9928]])), ('linear.bias', tensor([1.0412]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0454]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0438]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0506]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[2.0008]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0417]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0418]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0410]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0350]))])
OrderedDict([('linear.weight', tensor([[1.9962]])), ('linear.bias', tensor([1.0321]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0439]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0495]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0477]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0459]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0464]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0496]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0530]))])
OrderedDict([('linear.weight', tensor([[2.0041]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[1.9946]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[1.9916]])), ('linear.bias', tensor([1.0472]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', tensor([[1.9932]])), ('linear.bias', tensor([1.0459]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[1.9924]])), ('linear.bias', tensor([1.0438]))])
OrderedDict([('linear.weight', tensor([[1.9931]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9936]])), ('linear.bias', tensor([1.0562]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0624]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0620]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0597]))])
OrderedDict([('linear.weight', tensor([[1.9990]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0504]))])
OrderedDict([('linear.weight', tensor([[2.0005]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0608]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0588]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0469]))])
OrderedDict([('linear.weight', tensor([[2.0040]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[2.0020]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0634]))])
OrderedDict([('linear.weight', tensor([[2.0017]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0019]])), ('linear.bias', tensor([1.0568]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[1.9988]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0521]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0544]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0517]))])
OrderedDict([('linear.weight', tensor([[1.9921]])), ('linear.bias', tensor([1.0434]))])
OrderedDict([('linear.weight', tensor([[1.9964]])), ('linear.bias', tensor([1.0509]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0540]))])
OrderedDict([('linear.weight', tensor([[1.9935]])), ('linear.bias', tensor([1.0485]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0528]))])
OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0492]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0446]))])
OrderedDict([('linear.weight', tensor([[2.0000]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[2.0030]])), ('linear.bias', tensor([1.0505]))])
OrderedDict([('linear.weight', tensor([[2.0042]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[2.0054]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[2.0070]])), ('linear.bias', tensor([1.0596]))])
OrderedDict([('linear.weight', tensor([[2.0029]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9945]])), ('linear.bias', tensor([1.0457]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', tensor([[1.9927]])), ('linear.bias', tensor([1.0452]))])
OrderedDict([('linear.weight', tensor([[1.9895]])), ('linear.bias', tensor([1.0385]))])
OrderedDict([('linear.weight', tensor([[1.9924]])), ('linear.bias', tensor([1.0448]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0480]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0596]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9906]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[1.9905]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9919]])), ('linear.bias', tensor([1.0435]))])
OrderedDict([('linear.weight', tensor([[1.9898]])), ('linear.bias', tensor([1.0408]))])
OrderedDict([('linear.weight', tensor([[1.9930]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0598]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0581]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0550]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0022]])), ('linear.bias', tensor([1.0551]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0619]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', tensor([[1.9979]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0595]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0518]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0546]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0592]))])
OrderedDict([('linear.weight', tensor([[1.9978]])), ('linear.bias', tensor([1.0579]))])
OrderedDict([('linear.weight', tensor([[1.9937]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9928]])), ('linear.bias', tensor([1.0487]))])
OrderedDict([('linear.weight', tensor([[1.9904]])), ('linear.bias', tensor([1.0497]))])
OrderedDict([('linear.weight', tensor([[1.9914]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0602]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9938]])), ('linear.bias', tensor([1.0571]))])
OrderedDict([('linear.weight', tensor([[1.9919]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[1.9905]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9893]])), ('linear.bias', tensor([1.0498]))])
OrderedDict([('linear.weight', tensor([[1.9909]])), ('linear.bias', tensor([1.0512]))])
OrderedDict([('linear.weight', tensor([[1.9927]])), ('linear.bias', tensor([1.0542]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9951]])), ('linear.bias', tensor([1.0432]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0374]))])
OrderedDict([('linear.weight', tensor([[2.0002]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0386]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0388]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0360]))])
OrderedDict([('linear.weight', tensor([[2.0023]])), ('linear.bias', tensor([1.0445]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0398]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0379]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[2.0031]])), ('linear.bias', tensor([1.0470]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0439]))])
OrderedDict([('linear.weight', tensor([[1.9966]])), ('linear.bias', tensor([1.0456]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0515]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0507]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0609]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0589]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0538]))])
OrderedDict([('linear.weight', tensor([[1.9975]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9985]])), ('linear.bias', tensor([1.0533]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0013]])), ('linear.bias', tensor([1.0545]))])
OrderedDict([('linear.weight', tensor([[2.0037]])), ('linear.bias', tensor([1.0603]))])
OrderedDict([('linear.weight', tensor([[2.0034]])), ('linear.bias', tensor([1.0573]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0532]))])
OrderedDict([('linear.weight', tensor([[2.0043]])), ('linear.bias', tensor([1.0586]))])
OrderedDict([('linear.weight', tensor([[2.0045]])), ('linear.bias', tensor([1.0593]))])
OrderedDict([('linear.weight', tensor([[2.0061]])), ('linear.bias', tensor([1.0642]))])
OrderedDict([('linear.weight', tensor([[2.0006]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0520]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0478]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0024]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[1.9989]])), ('linear.bias', tensor([1.0503]))])
OrderedDict([('linear.weight', tensor([[1.9992]])), ('linear.bias', tensor([1.0514]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0516]))])
OrderedDict([('linear.weight', tensor([[1.9982]])), ('linear.bias', tensor([1.0519]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0526]))])
OrderedDict([('linear.weight', tensor([[1.9927]])), ('linear.bias', tensor([1.0483]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0543]))])
OrderedDict([('linear.weight', tensor([[1.9968]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0447]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9957]])), ('linear.bias', tensor([1.0513]))])
OrderedDict([('linear.weight', tensor([[1.9977]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[1.9997]])), ('linear.bias', tensor([1.0582]))])
OrderedDict([('linear.weight', tensor([[2.0011]])), ('linear.bias', tensor([1.0591]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0575]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0570]))])
OrderedDict([('linear.weight', tensor([[2.0028]])), ('linear.bias', tensor([1.0597]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0574]))])
OrderedDict([('linear.weight', tensor([[1.9953]])), ('linear.bias', tensor([1.0467]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0014]])), ('linear.bias', tensor([1.0560]))])
OrderedDict([('linear.weight', tensor([[2.0015]])), ('linear.bias', tensor([1.0552]))])
OrderedDict([('linear.weight', tensor([[1.9984]])), ('linear.bias', tensor([1.0511]))])
OrderedDict([('linear.weight', tensor([[1.9961]])), ('linear.bias', tensor([1.0471]))])
OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0474]))])
OrderedDict([('linear.weight', tensor([[1.9959]])), ('linear.bias', tensor([1.0468]))])
OrderedDict([('linear.weight', tensor([[1.9924]])), ('linear.bias', tensor([1.0394]))])
OrderedDict([('linear.weight', tensor([[1.9922]])), ('linear.bias', tensor([1.0389]))])
OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0425]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0443]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0490]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9952]])), ('linear.bias', tensor([1.0585]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0566]))])
OrderedDict([('linear.weight', tensor([[1.9950]])), ('linear.bias', tensor([1.0567]))])
OrderedDict([('linear.weight', tensor([[1.9974]])), ('linear.bias', tensor([1.0604]))])
OrderedDict([('linear.weight', tensor([[1.9971]])), ('linear.bias', tensor([1.0577]))])
OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0476]))])
OrderedDict([('linear.weight', tensor([[1.9970]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[1.9969]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[1.9943]])), ('linear.bias', tensor([1.0423]))])
OrderedDict([('linear.weight', tensor([[1.9960]])), ('linear.bias', tensor([1.0442]))])
OrderedDict([('linear.weight', tensor([[1.9995]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0523]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0534]))])
OrderedDict([('linear.weight', tensor([[1.9987]])), ('linear.bias', tensor([1.0455]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0458]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0549]))])
OrderedDict([('linear.weight', tensor([[2.0033]])), ('linear.bias', tensor([1.0548]))])
OrderedDict([('linear.weight', tensor([[2.0035]])), ('linear.bias', tensor([1.0563]))])
OrderedDict([('linear.weight', tensor([[2.0054]])), ('linear.bias', tensor([1.0590]))])
OrderedDict([('linear.weight', tensor([[2.0032]])), ('linear.bias', tensor([1.0564]))])
OrderedDict([('linear.weight', tensor([[2.0021]])), ('linear.bias', tensor([1.0553]))])
OrderedDict([('linear.weight', tensor([[2.0009]])), ('linear.bias', tensor([1.0547]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9956]])), ('linear.bias', tensor([1.0400]))])
OrderedDict([('linear.weight', tensor([[1.9967]])), ('linear.bias', tensor([1.0406]))])
OrderedDict([('linear.weight', tensor([[1.9973]])), ('linear.bias', tensor([1.0431]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0488]))])
OrderedDict([('linear.weight', tensor([[2.0004]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9981]])), ('linear.bias', tensor([1.0481]))])
OrderedDict([('linear.weight', tensor([[1.9983]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9999]])), ('linear.bias', tensor([1.0491]))])
OrderedDict([('linear.weight', tensor([[2.0012]])), ('linear.bias', tensor([1.0500]))])
OrderedDict([('linear.weight', tensor([[2.0007]])), ('linear.bias', tensor([1.0494]))])
OrderedDict([('linear.weight', tensor([[1.9998]])), ('linear.bias', tensor([1.0484]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[1.9955]])), ('linear.bias', tensor([1.0466]))])
OrderedDict([('linear.weight', tensor([[1.9940]])), ('linear.bias', tensor([1.0414]))])
OrderedDict([('linear.weight', tensor([[1.9916]])), ('linear.bias', tensor([1.0430]))])
OrderedDict([('linear.weight', tensor([[1.9942]])), ('linear.bias', tensor([1.0522]))])
OrderedDict([('linear.weight', tensor([[1.9944]])), ('linear.bias', tensor([1.0555]))])
OrderedDict([('linear.weight', tensor([[1.9954]])), ('linear.bias', tensor([1.0535]))])
OrderedDict([('linear.weight', tensor([[1.9958]])), ('linear.bias', tensor([1.0549]))])
OrderedDict([('linear.weight', tensor([[1.9926]])), ('linear.bias', tensor([1.0461]))])
OrderedDict([('linear.weight', tensor([[1.9891]])), ('linear.bias', tensor([1.0402]))])
OrderedDict([('linear.weight', tensor([[1.9883]])), ('linear.bias', tensor([1.0372]))])
OrderedDict([('linear.weight', tensor([[1.9910]])), ('linear.bias', tensor([1.0416]))])
OrderedDict([('linear.weight', t

OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0038]])), ('linear.bias', tensor([1.0539]))])
OrderedDict([('linear.weight', tensor([[2.0046]])), ('linear.bias', tensor([1.0536]))])
OrderedDict([('linear.weight', tensor([[2.0056]])), ('linear.bias', tensor([1.0561]))])
OrderedDict([('linear.weight', tensor([[2.0025]])), ('linear.bias', tensor([1.0508]))])
OrderedDict([('linear.weight', tensor([[1.9972]])), ('linear.bias', tensor([1.0449]))])
OrderedDict([('linear.weight', tensor([[2.0010]])), ('linear.bias', tensor([1.0492]))])
OrderedDict([('linear.weight', tensor([[1.9986]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9965]])), ('linear.bias', tensor([1.0441]))])
OrderedDict([('linear.weight', tensor([[1.9991]])), ('linear.bias', tensor([1.0463]))])
OrderedDict([('linear.weight', tensor([[1.9993]])), ('linear.bias', tensor([1.0444]))])
OrderedDict([('linear.weight', t

In [37]:
# Model's parameter before training 
print(model.state_dict())

OrderedDict([('linear.weight', tensor([[2.0054]])), ('linear.bias', tensor([1.0554]))])


In [30]:
# Check model's parameters
#print(model.state_dict())

In [31]:
print(list(model.parameters()))

[Parameter containing:
tensor([[1.9994]], requires_grad=True), Parameter containing:
tensor([1.0510], requires_grad=True)]
