In [1]:
import torch
import torch.nn as nn

In [2]:
input = torch.tensor([1,2,3],dtype=torch.float32)
target = torch.tensor([1,2,5],dtype=torch.float32)

In [3]:
input

tensor([1., 2., 3.])

In [4]:
target

tensor([1., 2., 5.])

In [5]:
input = torch.reshape(input,(1,1,1,3))
target = torch.reshape(target,(1,1,1,3))

In [6]:
input

tensor([[[[1., 2., 3.]]]])

In [7]:
target

tensor([[[[1., 2., 5.]]]])

## ## L1Loss  

In [10]:
loss = nn.L1Loss()  # 设置reduction = 'sum' 就是求和，不求均值
result = loss(input,target)

In [11]:
result

tensor(0.6667)

![image.png](attachment:image.png)

##  MSELoss 

In [13]:
loss_mse = nn.MSELoss()
result_mse = loss_mse(input,target) 

In [14]:
result_mse

tensor(1.3333)

![image.png](attachment:image.png)

## CROSSENTROPYLoss

In [16]:
x = torch.tensor([0.1,0.2,0.3])
y = torch.tensor([1])

In [19]:
x = torch.reshape(x,(1,3)) # 有三类
x

tensor([[0.1000, 0.2000, 0.3000]])

In [18]:
loss_cross = nn.CrossEntropyLoss()

In [20]:
result_Cross = loss_cross(x,y)
result_Cross

tensor(1.1019)

![QQ%E5%9B%BE%E7%89%8720220420200629.png](attachment:QQ%E5%9B%BE%E7%89%8720220420200629.png)

## 损失函数实操 

In [21]:
class Model2(nn.Module):
    def __init__(self):
        super(Model2,self).__init__()
        self.model = nn.Sequential(
            nn.Conv2d(3,32,5,padding=2),
            nn.MaxPool2d(2),
            nn.Conv2d(32,32,5,padding=2),
            nn.MaxPool2d(2),
            nn.Conv2d(32,64,5,padding=2),
            nn.MaxPool2d(2),
            nn.Flatten(),
            nn.Linear(1024,64),
            nn.Linear(64,10)
        )
    
    def forward(self,x):
        x = self.model(x)
        return x

In [29]:
import torchvision
from torch.utils.data import DataLoader

In [30]:
dataset = torchvision.datasets.CIFAR10(
    root = "../../../datas",
    train = False,
    download = True,
    transform = torchvision.transforms.ToTensor()
)

Files already downloaded and verified


In [34]:
dataloader = DataLoader(dataset,batch_size=1)

In [35]:
model = Model2()

In [39]:
for data in dataloader:
    imgs,targets = data
    outputs = model(imgs)
#     print(outputs)
#     print(targets)
    result_loss = loss(outputs,targets)
    print(result_loss) #实际输出与目标之间的误差

tensor(8.8419, grad_fn=<MseLossBackward0>)
tensor(63.6145, grad_fn=<MseLossBackward0>)
tensor(63.6883, grad_fn=<MseLossBackward0>)
tensor(0.0080, grad_fn=<MseLossBackward0>)
tensor(35.7185, grad_fn=<MseLossBackward0>)
tensor(35.6802, grad_fn=<MseLossBackward0>)
tensor(0.9537, grad_fn=<MseLossBackward0>)
tensor(35.6765, grad_fn=<MseLossBackward0>)
tensor(8.8858, grad_fn=<MseLossBackward0>)
tensor(0.9573, grad_fn=<MseLossBackward0>)
tensor(0.0074, grad_fn=<MseLossBackward0>)
tensor(80.4855, grad_fn=<MseLossBackward0>)
tensor(24.7315, grad_fn=<MseLossBackward0>)
tensor(48.6315, grad_fn=<MseLossBackward0>)
tensor(80.4770, grad_fn=<MseLossBackward0>)
tensor(63.5788, grad_fn=<MseLossBackward0>)
tensor(24.7731, grad_fn=<MseLossBackward0>)
tensor(48.6468, grad_fn=<MseLossBackward0>)
tensor(63.6704, grad_fn=<MseLossBackward0>)
tensor(35.7315, grad_fn=<MseLossBackward0>)
tensor(48.6081, grad_fn=<MseLossBackward0>)
tensor(0.0094, grad_fn=<MseLossBackward0>)
tensor(15.7779, grad_fn=<MseLossBackwar

tensor(63.5953, grad_fn=<MseLossBackward0>)
tensor(48.6227, grad_fn=<MseLossBackward0>)
tensor(0.9585, grad_fn=<MseLossBackward0>)
tensor(8.8733, grad_fn=<MseLossBackward0>)
tensor(0.0068, grad_fn=<MseLossBackward0>)
tensor(24.7527, grad_fn=<MseLossBackward0>)
tensor(48.5695, grad_fn=<MseLossBackward0>)
tensor(80.6643, grad_fn=<MseLossBackward0>)
tensor(48.6140, grad_fn=<MseLossBackward0>)
tensor(15.8253, grad_fn=<MseLossBackward0>)
tensor(24.7705, grad_fn=<MseLossBackward0>)
tensor(80.6116, grad_fn=<MseLossBackward0>)
tensor(63.5660, grad_fn=<MseLossBackward0>)
tensor(0.0099, grad_fn=<MseLossBackward0>)
tensor(48.6355, grad_fn=<MseLossBackward0>)
tensor(80.5880, grad_fn=<MseLossBackward0>)
tensor(63.6567, grad_fn=<MseLossBackward0>)
tensor(3.9076, grad_fn=<MseLossBackward0>)
tensor(48.6955, grad_fn=<MseLossBackward0>)
tensor(35.7114, grad_fn=<MseLossBackward0>)
tensor(80.6470, grad_fn=<MseLossBackward0>)
tensor(15.8055, grad_fn=<MseLossBackward0>)
tensor(8.8643, grad_fn=<MseLossBackwa

tensor(80.3632, grad_fn=<MseLossBackward0>)
tensor(35.6847, grad_fn=<MseLossBackward0>)
tensor(3.9000, grad_fn=<MseLossBackward0>)
tensor(8.8289, grad_fn=<MseLossBackward0>)
tensor(0.0067, grad_fn=<MseLossBackward0>)
tensor(8.8289, grad_fn=<MseLossBackward0>)
tensor(80.6127, grad_fn=<MseLossBackward0>)
tensor(63.6210, grad_fn=<MseLossBackward0>)
tensor(48.6107, grad_fn=<MseLossBackward0>)
tensor(63.6143, grad_fn=<MseLossBackward0>)
tensor(63.5452, grad_fn=<MseLossBackward0>)
tensor(15.7880, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(0.9545, grad_fn=<MseLossBackward0>)
tensor(63.6363, grad_fn=<MseLossBackward0>)
tensor(3.8911, grad_fn=<MseLossBackward0>)
tensor(48.6786, grad_fn=<MseLossBackward0>)
tensor(80.5484, grad_fn=<MseLossBackward0>)
tensor(8.8239, grad_fn=<MseLossBackward0>)
tensor(35.7044, grad_fn=<MseLossBackward0>)
tensor(0.9598, grad_fn=<MseLossBackward0>)
tensor(80.6241, grad_fn=<MseLossBackward0>)
tensor(0.0094, grad_fn=<MseLossBackward0>

tensor(80.5393, grad_fn=<MseLossBackward0>)
tensor(3.9029, grad_fn=<MseLossBackward0>)
tensor(35.7034, grad_fn=<MseLossBackward0>)
tensor(0.9607, grad_fn=<MseLossBackward0>)
tensor(15.8139, grad_fn=<MseLossBackward0>)
tensor(48.6215, grad_fn=<MseLossBackward0>)
tensor(8.8696, grad_fn=<MseLossBackward0>)
tensor(24.7612, grad_fn=<MseLossBackward0>)
tensor(8.8677, grad_fn=<MseLossBackward0>)
tensor(63.6145, grad_fn=<MseLossBackward0>)
tensor(24.7628, grad_fn=<MseLossBackward0>)
tensor(0.0084, grad_fn=<MseLossBackward0>)
tensor(3.9081, grad_fn=<MseLossBackward0>)
tensor(0.9572, grad_fn=<MseLossBackward0>)
tensor(35.7524, grad_fn=<MseLossBackward0>)
tensor(15.7752, grad_fn=<MseLossBackward0>)
tensor(8.8674, grad_fn=<MseLossBackward0>)
tensor(8.8318, grad_fn=<MseLossBackward0>)
tensor(80.5192, grad_fn=<MseLossBackward0>)
tensor(35.6946, grad_fn=<MseLossBackward0>)
tensor(80.6015, grad_fn=<MseLossBackward0>)
tensor(63.6472, grad_fn=<MseLossBackward0>)
tensor(63.6764, grad_fn=<MseLossBackward0

tensor(8.8556, grad_fn=<MseLossBackward0>)
tensor(80.4921, grad_fn=<MseLossBackward0>)
tensor(35.6797, grad_fn=<MseLossBackward0>)
tensor(63.5439, grad_fn=<MseLossBackward0>)
tensor(8.8453, grad_fn=<MseLossBackward0>)
tensor(0.0097, grad_fn=<MseLossBackward0>)
tensor(8.8782, grad_fn=<MseLossBackward0>)
tensor(15.7957, grad_fn=<MseLossBackward0>)
tensor(48.6460, grad_fn=<MseLossBackward0>)
tensor(48.6171, grad_fn=<MseLossBackward0>)
tensor(0.9545, grad_fn=<MseLossBackward0>)
tensor(15.7874, grad_fn=<MseLossBackward0>)
tensor(48.6607, grad_fn=<MseLossBackward0>)
tensor(3.9058, grad_fn=<MseLossBackward0>)
tensor(48.5955, grad_fn=<MseLossBackward0>)
tensor(0.9482, grad_fn=<MseLossBackward0>)
tensor(15.8156, grad_fn=<MseLossBackward0>)
tensor(48.6512, grad_fn=<MseLossBackward0>)
tensor(15.8085, grad_fn=<MseLossBackward0>)
tensor(15.7947, grad_fn=<MseLossBackward0>)
tensor(63.6142, grad_fn=<MseLossBackward0>)
tensor(15.8122, grad_fn=<MseLossBackward0>)
tensor(48.6300, grad_fn=<MseLossBackwar

tensor(15.8142, grad_fn=<MseLossBackward0>)
tensor(48.6093, grad_fn=<MseLossBackward0>)
tensor(63.6407, grad_fn=<MseLossBackward0>)
tensor(8.8663, grad_fn=<MseLossBackward0>)
tensor(0.9587, grad_fn=<MseLossBackward0>)
tensor(3.8842, grad_fn=<MseLossBackward0>)
tensor(0.0083, grad_fn=<MseLossBackward0>)
tensor(0.9482, grad_fn=<MseLossBackward0>)
tensor(24.7197, grad_fn=<MseLossBackward0>)
tensor(63.6704, grad_fn=<MseLossBackward0>)
tensor(15.7998, grad_fn=<MseLossBackward0>)
tensor(35.7414, grad_fn=<MseLossBackward0>)
tensor(8.8350, grad_fn=<MseLossBackward0>)
tensor(63.6128, grad_fn=<MseLossBackward0>)
tensor(0.9523, grad_fn=<MseLossBackward0>)
tensor(8.8726, grad_fn=<MseLossBackward0>)
tensor(63.6019, grad_fn=<MseLossBackward0>)
tensor(24.8006, grad_fn=<MseLossBackward0>)
tensor(0.0074, grad_fn=<MseLossBackward0>)
tensor(63.6045, grad_fn=<MseLossBackward0>)
tensor(15.8107, grad_fn=<MseLossBackward0>)
tensor(63.6079, grad_fn=<MseLossBackward0>)
tensor(0.9452, grad_fn=<MseLossBackward0>

tensor(8.8705, grad_fn=<MseLossBackward0>)
tensor(0.9558, grad_fn=<MseLossBackward0>)
tensor(80.6127, grad_fn=<MseLossBackward0>)
tensor(0.9581, grad_fn=<MseLossBackward0>)
tensor(80.5324, grad_fn=<MseLossBackward0>)
tensor(35.7464, grad_fn=<MseLossBackward0>)
tensor(8.8717, grad_fn=<MseLossBackward0>)
tensor(8.8443, grad_fn=<MseLossBackward0>)
tensor(8.8337, grad_fn=<MseLossBackward0>)
tensor(0.9569, grad_fn=<MseLossBackward0>)
tensor(0.0086, grad_fn=<MseLossBackward0>)
tensor(35.6884, grad_fn=<MseLossBackward0>)
tensor(0.9568, grad_fn=<MseLossBackward0>)
tensor(15.7769, grad_fn=<MseLossBackward0>)
tensor(0.9496, grad_fn=<MseLossBackward0>)
tensor(0.0071, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(0.9441, grad_fn=<MseLossBackward0>)
tensor(0.9489, grad_fn=<MseLossBackward0>)
tensor(35.6860, grad_fn=<MseLossBackward0>)
tensor(24.7668, grad_fn=<MseLossBackward0>)
tensor(15.8210, grad_fn=<MseLossBackward0>)
tensor(35.7689, grad_fn=<MseLossBackward0>)
te

tensor(48.6568, grad_fn=<MseLossBackward0>)
tensor(3.8948, grad_fn=<MseLossBackward0>)
tensor(15.7884, grad_fn=<MseLossBackward0>)
tensor(35.6603, grad_fn=<MseLossBackward0>)
tensor(8.8411, grad_fn=<MseLossBackward0>)
tensor(0.9570, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(48.6807, grad_fn=<MseLossBackward0>)
tensor(3.8853, grad_fn=<MseLossBackward0>)
tensor(24.7495, grad_fn=<MseLossBackward0>)
tensor(15.8386, grad_fn=<MseLossBackward0>)
tensor(48.5835, grad_fn=<MseLossBackward0>)
tensor(35.7035, grad_fn=<MseLossBackward0>)
tensor(0.9460, grad_fn=<MseLossBackward0>)
tensor(0.9551, grad_fn=<MseLossBackward0>)
tensor(80.5650, grad_fn=<MseLossBackward0>)
tensor(63.6359, grad_fn=<MseLossBackward0>)
tensor(0.9579, grad_fn=<MseLossBackward0>)
tensor(0.0085, grad_fn=<MseLossBackward0>)
tensor(0.9593, grad_fn=<MseLossBackward0>)
tensor(8.8730, grad_fn=<MseLossBackward0>)
tensor(0.9698, grad_fn=<MseLossBackward0>)
tensor(0.9497, grad_fn=<MseLossBackward0>)
t

tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(35.6857, grad_fn=<MseLossBackward0>)
tensor(3.9002, grad_fn=<MseLossBackward0>)
tensor(80.5893, grad_fn=<MseLossBackward0>)
tensor(0.9598, grad_fn=<MseLossBackward0>)
tensor(48.6614, grad_fn=<MseLossBackward0>)
tensor(48.7220, grad_fn=<MseLossBackward0>)
tensor(24.7229, grad_fn=<MseLossBackward0>)
tensor(3.9152, grad_fn=<MseLossBackward0>)
tensor(24.7721, grad_fn=<MseLossBackward0>)
tensor(35.7138, grad_fn=<MseLossBackward0>)
tensor(15.7867, grad_fn=<MseLossBackward0>)
tensor(0.9572, grad_fn=<MseLossBackward0>)
tensor(15.7712, grad_fn=<MseLossBackward0>)
tensor(8.8680, grad_fn=<MseLossBackward0>)
tensor(8.8527, grad_fn=<MseLossBackward0>)
tensor(8.8304, grad_fn=<MseLossBackward0>)
tensor(0.0070, grad_fn=<MseLossBackward0>)
tensor(8.8355, grad_fn=<MseLossBackward0>)
tensor(24.7359, grad_fn=<MseLossBackward0>)
tensor(24.7535, grad_fn=<MseLossBackward0>)
tensor(63.5564, grad_fn=<MseLossBackward0>)
tensor(80.5987, grad_fn=<MseLossBackward0>

tensor(3.8926, grad_fn=<MseLossBackward0>)
tensor(0.9627, grad_fn=<MseLossBackward0>)
tensor(48.6355, grad_fn=<MseLossBackward0>)
tensor(3.8962, grad_fn=<MseLossBackward0>)
tensor(63.5635, grad_fn=<MseLossBackward0>)
tensor(24.7814, grad_fn=<MseLossBackward0>)
tensor(24.7477, grad_fn=<MseLossBackward0>)
tensor(8.8367, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(15.8068, grad_fn=<MseLossBackward0>)
tensor(63.6373, grad_fn=<MseLossBackward0>)
tensor(8.8362, grad_fn=<MseLossBackward0>)
tensor(48.6686, grad_fn=<MseLossBackward0>)
tensor(35.7359, grad_fn=<MseLossBackward0>)
tensor(8.8580, grad_fn=<MseLossBackward0>)
tensor(63.6188, grad_fn=<MseLossBackward0>)
tensor(0.9545, grad_fn=<MseLossBackward0>)
tensor(0.0081, grad_fn=<MseLossBackward0>)
tensor(0.9473, grad_fn=<MseLossBackward0>)
tensor(8.8794, grad_fn=<MseLossBackward0>)
tensor(8.8683, grad_fn=<MseLossBackward0>)
tensor(0.0077, grad_fn=<MseLossBackward0>)
tensor(48.6537, grad_fn=<MseLossBackward0>)
t

tensor(48.6402, grad_fn=<MseLossBackward0>)
tensor(35.6741, grad_fn=<MseLossBackward0>)
tensor(3.8981, grad_fn=<MseLossBackward0>)
tensor(8.8601, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(48.7193, grad_fn=<MseLossBackward0>)
tensor(48.6354, grad_fn=<MseLossBackward0>)
tensor(63.6173, grad_fn=<MseLossBackward0>)
tensor(0.9591, grad_fn=<MseLossBackward0>)
tensor(0.9545, grad_fn=<MseLossBackward0>)
tensor(15.7954, grad_fn=<MseLossBackward0>)
tensor(35.6995, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(35.7678, grad_fn=<MseLossBackward0>)
tensor(35.7167, grad_fn=<MseLossBackward0>)
tensor(24.7379, grad_fn=<MseLossBackward0>)
tensor(24.7372, grad_fn=<MseLossBackward0>)
tensor(35.7221, grad_fn=<MseLossBackward0>)
tensor(8.8439, grad_fn=<MseLossBackward0>)
tensor(80.5847, grad_fn=<MseLossBackward0>)
tensor(8.8527, grad_fn=<MseLossBackward0>)
tensor(35.6747, grad_fn=<MseLossBackward0>)
tensor(63.6463, grad_fn=<MseLossBackward

tensor(80.4988, grad_fn=<MseLossBackward0>)
tensor(63.6557, grad_fn=<MseLossBackward0>)
tensor(0.0081, grad_fn=<MseLossBackward0>)
tensor(24.7531, grad_fn=<MseLossBackward0>)
tensor(24.8385, grad_fn=<MseLossBackward0>)
tensor(48.6831, grad_fn=<MseLossBackward0>)
tensor(0.9593, grad_fn=<MseLossBackward0>)
tensor(3.9007, grad_fn=<MseLossBackward0>)
tensor(0.0087, grad_fn=<MseLossBackward0>)
tensor(48.6529, grad_fn=<MseLossBackward0>)
tensor(24.7547, grad_fn=<MseLossBackward0>)
tensor(63.6383, grad_fn=<MseLossBackward0>)
tensor(3.8995, grad_fn=<MseLossBackward0>)
tensor(3.9021, grad_fn=<MseLossBackward0>)
tensor(24.7038, grad_fn=<MseLossBackward0>)
tensor(8.8363, grad_fn=<MseLossBackward0>)
tensor(80.5470, grad_fn=<MseLossBackward0>)
tensor(8.8674, grad_fn=<MseLossBackward0>)
tensor(0.9551, grad_fn=<MseLossBackward0>)
tensor(80.5004, grad_fn=<MseLossBackward0>)
tensor(8.8606, grad_fn=<MseLossBackward0>)
tensor(0.9558, grad_fn=<MseLossBackward0>)
tensor(15.7906, grad_fn=<MseLossBackward0>)

tensor(63.7103, grad_fn=<MseLossBackward0>)
tensor(80.5140, grad_fn=<MseLossBackward0>)
tensor(63.6433, grad_fn=<MseLossBackward0>)
tensor(0.9565, grad_fn=<MseLossBackward0>)
tensor(48.5571, grad_fn=<MseLossBackward0>)
tensor(3.8833, grad_fn=<MseLossBackward0>)
tensor(48.6275, grad_fn=<MseLossBackward0>)
tensor(3.9105, grad_fn=<MseLossBackward0>)
tensor(8.8537, grad_fn=<MseLossBackward0>)
tensor(3.9168, grad_fn=<MseLossBackward0>)
tensor(35.7316, grad_fn=<MseLossBackward0>)
tensor(48.6648, grad_fn=<MseLossBackward0>)
tensor(80.4682, grad_fn=<MseLossBackward0>)
tensor(15.7729, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(0.9565, grad_fn=<MseLossBackward0>)
tensor(0.0070, grad_fn=<MseLossBackward0>)
tensor(15.8290, grad_fn=<MseLossBackward0>)
tensor(24.7379, grad_fn=<MseLossBackward0>)
tensor(0.0088, grad_fn=<MseLossBackward0>)
tensor(63.6441, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(48.6816, grad_fn=<MseLossBackward0>

tensor(48.6392, grad_fn=<MseLossBackward0>)
tensor(35.7075, grad_fn=<MseLossBackward0>)
tensor(3.8875, grad_fn=<MseLossBackward0>)
tensor(15.8009, grad_fn=<MseLossBackward0>)
tensor(48.6063, grad_fn=<MseLossBackward0>)
tensor(48.6761, grad_fn=<MseLossBackward0>)
tensor(35.7327, grad_fn=<MseLossBackward0>)
tensor(15.8074, grad_fn=<MseLossBackward0>)
tensor(3.8964, grad_fn=<MseLossBackward0>)
tensor(3.8971, grad_fn=<MseLossBackward0>)
tensor(8.8643, grad_fn=<MseLossBackward0>)
tensor(3.8928, grad_fn=<MseLossBackward0>)
tensor(15.8034, grad_fn=<MseLossBackward0>)
tensor(80.4783, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(0.0087, grad_fn=<MseLossBackward0>)
tensor(80.5879, grad_fn=<MseLossBackward0>)
tensor(35.7050, grad_fn=<MseLossBackward0>)
tensor(24.6979, grad_fn=<MseLossBackward0>)
tensor(63.6159, grad_fn=<MseLossBackward0>)
tensor(24.7912, grad_fn=<MseLossBackward0>)
tensor(3.9290, grad_fn=<MseLossBackward0>)
tensor(15.8165, grad_fn=<MseLossBackward

tensor(15.8145, grad_fn=<MseLossBackward0>)
tensor(24.7668, grad_fn=<MseLossBackward0>)
tensor(24.7545, grad_fn=<MseLossBackward0>)
tensor(3.9043, grad_fn=<MseLossBackward0>)
tensor(48.7077, grad_fn=<MseLossBackward0>)
tensor(48.6444, grad_fn=<MseLossBackward0>)
tensor(35.7209, grad_fn=<MseLossBackward0>)
tensor(0.9588, grad_fn=<MseLossBackward0>)
tensor(3.8977, grad_fn=<MseLossBackward0>)
tensor(8.8268, grad_fn=<MseLossBackward0>)
tensor(48.6482, grad_fn=<MseLossBackward0>)
tensor(24.7453, grad_fn=<MseLossBackward0>)
tensor(15.7736, grad_fn=<MseLossBackward0>)
tensor(8.8578, grad_fn=<MseLossBackward0>)
tensor(48.5980, grad_fn=<MseLossBackward0>)
tensor(48.6611, grad_fn=<MseLossBackward0>)
tensor(0.0076, grad_fn=<MseLossBackward0>)
tensor(0.0084, grad_fn=<MseLossBackward0>)
tensor(0.9576, grad_fn=<MseLossBackward0>)
tensor(15.7686, grad_fn=<MseLossBackward0>)
tensor(15.7841, grad_fn=<MseLossBackward0>)
tensor(8.8441, grad_fn=<MseLossBackward0>)
tensor(48.6412, grad_fn=<MseLossBackward0

tensor(48.6816, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(48.7034, grad_fn=<MseLossBackward0>)
tensor(0.0071, grad_fn=<MseLossBackward0>)
tensor(24.7648, grad_fn=<MseLossBackward0>)
tensor(24.7535, grad_fn=<MseLossBackward0>)
tensor(15.7878, grad_fn=<MseLossBackward0>)
tensor(8.8432, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(80.4461, grad_fn=<MseLossBackward0>)
tensor(80.5221, grad_fn=<MseLossBackward0>)
tensor(0.0085, grad_fn=<MseLossBackward0>)
tensor(3.9192, grad_fn=<MseLossBackward0>)
tensor(3.9058, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(63.5443, grad_fn=<MseLossBackward0>)
tensor(15.7942, grad_fn=<MseLossBackward0>)
tensor(15.7966, grad_fn=<MseLossBackward0>)
tensor(24.7766, grad_fn=<MseLossBackward0>)
tensor(3.9004, grad_fn=<MseLossBackward0>)
tensor(3.9146, grad_fn=<MseLossBackward0>)
tensor(0.9637, grad_fn=<MseLossBackward0>)
tensor(0.9632, grad_fn=<MseLossBackward0>)


tensor(80.5301, grad_fn=<MseLossBackward0>)
tensor(0.9665, grad_fn=<MseLossBackward0>)
tensor(80.5453, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(0.9495, grad_fn=<MseLossBackward0>)
tensor(80.5263, grad_fn=<MseLossBackward0>)
tensor(3.8987, grad_fn=<MseLossBackward0>)
tensor(80.5751, grad_fn=<MseLossBackward0>)
tensor(80.5326, grad_fn=<MseLossBackward0>)
tensor(80.5120, grad_fn=<MseLossBackward0>)
tensor(0.0070, grad_fn=<MseLossBackward0>)
tensor(80.5381, grad_fn=<MseLossBackward0>)
tensor(80.5260, grad_fn=<MseLossBackward0>)
tensor(3.9052, grad_fn=<MseLossBackward0>)
tensor(0.9508, grad_fn=<MseLossBackward0>)
tensor(48.6457, grad_fn=<MseLossBackward0>)
tensor(0.0077, grad_fn=<MseLossBackward0>)
tensor(24.7819, grad_fn=<MseLossBackward0>)
tensor(35.7075, grad_fn=<MseLossBackward0>)
tensor(8.8673, grad_fn=<MseLossBackward0>)
tensor(80.6306, grad_fn=<MseLossBackward0>)
tensor(63.6404, grad_fn=<MseLossBackward0>)
tensor(8.8666, grad_fn=<MseLossBackward0>

tensor(24.7719, grad_fn=<MseLossBackward0>)
tensor(15.7676, grad_fn=<MseLossBackward0>)
tensor(63.6313, grad_fn=<MseLossBackward0>)
tensor(80.4762, grad_fn=<MseLossBackward0>)
tensor(48.6354, grad_fn=<MseLossBackward0>)
tensor(15.7974, grad_fn=<MseLossBackward0>)
tensor(15.7966, grad_fn=<MseLossBackward0>)
tensor(0.9649, grad_fn=<MseLossBackward0>)
tensor(3.9052, grad_fn=<MseLossBackward0>)
tensor(15.7580, grad_fn=<MseLossBackward0>)
tensor(80.5953, grad_fn=<MseLossBackward0>)
tensor(63.6427, grad_fn=<MseLossBackward0>)
tensor(48.6814, grad_fn=<MseLossBackward0>)
tensor(80.5498, grad_fn=<MseLossBackward0>)
tensor(24.7002, grad_fn=<MseLossBackward0>)
tensor(0.9450, grad_fn=<MseLossBackward0>)
tensor(3.9077, grad_fn=<MseLossBackward0>)
tensor(0.9617, grad_fn=<MseLossBackward0>)
tensor(35.6784, grad_fn=<MseLossBackward0>)
tensor(35.7297, grad_fn=<MseLossBackward0>)
tensor(15.8036, grad_fn=<MseLossBackward0>)
tensor(24.6978, grad_fn=<MseLossBackward0>)
tensor(48.6968, grad_fn=<MseLossBackw

tensor(0.9625, grad_fn=<MseLossBackward0>)
tensor(48.6156, grad_fn=<MseLossBackward0>)
tensor(35.6580, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(80.5782, grad_fn=<MseLossBackward0>)
tensor(8.8804, grad_fn=<MseLossBackward0>)
tensor(24.7411, grad_fn=<MseLossBackward0>)
tensor(8.8616, grad_fn=<MseLossBackward0>)
tensor(3.9192, grad_fn=<MseLossBackward0>)
tensor(24.7210, grad_fn=<MseLossBackward0>)
tensor(8.8612, grad_fn=<MseLossBackward0>)
tensor(15.7662, grad_fn=<MseLossBackward0>)
tensor(80.6069, grad_fn=<MseLossBackward0>)
tensor(48.6411, grad_fn=<MseLossBackward0>)
tensor(0.9546, grad_fn=<MseLossBackward0>)
tensor(15.8013, grad_fn=<MseLossBackward0>)
tensor(15.8042, grad_fn=<MseLossBackward0>)
tensor(35.7263, grad_fn=<MseLossBackward0>)
tensor(0.9629, grad_fn=<MseLossBackward0>)
tensor(8.8457, grad_fn=<MseLossBackward0>)
tensor(63.6222, grad_fn=<MseLossBackward0>)
tensor(63.6167, grad_fn=<MseLossBackward0>)
tensor(0.0067, grad_fn=<MseLossBackward0>

tensor(80.5177, grad_fn=<MseLossBackward0>)
tensor(3.8971, grad_fn=<MseLossBackward0>)
tensor(0.9624, grad_fn=<MseLossBackward0>)
tensor(3.9163, grad_fn=<MseLossBackward0>)
tensor(24.7283, grad_fn=<MseLossBackward0>)
tensor(35.6975, grad_fn=<MseLossBackward0>)
tensor(80.5630, grad_fn=<MseLossBackward0>)
tensor(48.6339, grad_fn=<MseLossBackward0>)
tensor(48.5825, grad_fn=<MseLossBackward0>)
tensor(8.8436, grad_fn=<MseLossBackward0>)
tensor(15.7744, grad_fn=<MseLossBackward0>)
tensor(3.8847, grad_fn=<MseLossBackward0>)
tensor(0.0098, grad_fn=<MseLossBackward0>)
tensor(3.8941, grad_fn=<MseLossBackward0>)
tensor(24.7530, grad_fn=<MseLossBackward0>)
tensor(35.7483, grad_fn=<MseLossBackward0>)
tensor(48.6116, grad_fn=<MseLossBackward0>)
tensor(8.8375, grad_fn=<MseLossBackward0>)
tensor(48.6484, grad_fn=<MseLossBackward0>)
tensor(80.4747, grad_fn=<MseLossBackward0>)
tensor(15.7901, grad_fn=<MseLossBackward0>)
tensor(3.9003, grad_fn=<MseLossBackward0>)
tensor(0.0102, grad_fn=<MseLossBackward0>

tensor(80.5926, grad_fn=<MseLossBackward0>)
tensor(80.4682, grad_fn=<MseLossBackward0>)
tensor(24.7515, grad_fn=<MseLossBackward0>)
tensor(80.5193, grad_fn=<MseLossBackward0>)
tensor(48.6018, grad_fn=<MseLossBackward0>)
tensor(35.7012, grad_fn=<MseLossBackward0>)
tensor(48.6260, grad_fn=<MseLossBackward0>)
tensor(48.7200, grad_fn=<MseLossBackward0>)
tensor(0.9563, grad_fn=<MseLossBackward0>)
tensor(0.9511, grad_fn=<MseLossBackward0>)
tensor(3.9032, grad_fn=<MseLossBackward0>)
tensor(15.7987, grad_fn=<MseLossBackward0>)
tensor(3.9022, grad_fn=<MseLossBackward0>)
tensor(0.0084, grad_fn=<MseLossBackward0>)
tensor(35.6996, grad_fn=<MseLossBackward0>)
tensor(63.5933, grad_fn=<MseLossBackward0>)
tensor(48.6010, grad_fn=<MseLossBackward0>)
tensor(35.7465, grad_fn=<MseLossBackward0>)
tensor(3.8938, grad_fn=<MseLossBackward0>)
tensor(3.8973, grad_fn=<MseLossBackward0>)
tensor(80.5360, grad_fn=<MseLossBackward0>)
tensor(63.5815, grad_fn=<MseLossBackward0>)
tensor(3.8834, grad_fn=<MseLossBackward

tensor(15.7981, grad_fn=<MseLossBackward0>)
tensor(48.6744, grad_fn=<MseLossBackward0>)
tensor(48.5870, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(35.7092, grad_fn=<MseLossBackward0>)
tensor(0.9558, grad_fn=<MseLossBackward0>)
tensor(8.8569, grad_fn=<MseLossBackward0>)
tensor(80.6314, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(80.5618, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(8.8477, grad_fn=<MseLossBackward0>)
tensor(63.6069, grad_fn=<MseLossBackward0>)
tensor(15.8164, grad_fn=<MseLossBackward0>)
tensor(63.5969, grad_fn=<MseLossBackward0>)
tensor(63.5876, grad_fn=<MseLossBackward0>)
tensor(15.8130, grad_fn=<MseLossBackward0>)
tensor(0.9611, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(3.9061, grad_fn=<MseLossBackward0>)
tensor(3.9236, grad_fn=<MseLossBackward0>)
tensor(15.8347, grad_fn=<MseLossBackward0>)
tensor(0.9596, grad_fn=<MseLossBackward0>)

tensor(8.8536, grad_fn=<MseLossBackward0>)
tensor(24.7816, grad_fn=<MseLossBackward0>)
tensor(8.8609, grad_fn=<MseLossBackward0>)
tensor(24.7864, grad_fn=<MseLossBackward0>)
tensor(48.5554, grad_fn=<MseLossBackward0>)
tensor(80.7575, grad_fn=<MseLossBackward0>)
tensor(63.6076, grad_fn=<MseLossBackward0>)
tensor(15.8052, grad_fn=<MseLossBackward0>)
tensor(15.7820, grad_fn=<MseLossBackward0>)
tensor(8.8524, grad_fn=<MseLossBackward0>)
tensor(0.9506, grad_fn=<MseLossBackward0>)
tensor(15.8115, grad_fn=<MseLossBackward0>)
tensor(63.6216, grad_fn=<MseLossBackward0>)
tensor(8.8154, grad_fn=<MseLossBackward0>)
tensor(35.7113, grad_fn=<MseLossBackward0>)
tensor(24.7608, grad_fn=<MseLossBackward0>)
tensor(8.8581, grad_fn=<MseLossBackward0>)
tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(63.6795, grad_fn=<MseLossBackward0>)
tensor(80.5761, grad_fn=<MseLossBackward0>)
tensor(24.7394, grad_fn=<MseLossBackward0>)
tensor(48.6497, grad_fn=<MseLossBackward0>)
tensor(35.6995, grad_fn=<MseLossBackwar

tensor(3.9021, grad_fn=<MseLossBackward0>)
tensor(0.9620, grad_fn=<MseLossBackward0>)
tensor(35.6846, grad_fn=<MseLossBackward0>)
tensor(15.8231, grad_fn=<MseLossBackward0>)
tensor(8.8330, grad_fn=<MseLossBackward0>)
tensor(0.0080, grad_fn=<MseLossBackward0>)
tensor(0.9567, grad_fn=<MseLossBackward0>)
tensor(15.7978, grad_fn=<MseLossBackward0>)
tensor(63.5623, grad_fn=<MseLossBackward0>)
tensor(35.7793, grad_fn=<MseLossBackward0>)
tensor(0.9598, grad_fn=<MseLossBackward0>)
tensor(48.6664, grad_fn=<MseLossBackward0>)
tensor(0.9711, grad_fn=<MseLossBackward0>)
tensor(8.8352, grad_fn=<MseLossBackward0>)
tensor(24.7656, grad_fn=<MseLossBackward0>)
tensor(15.7717, grad_fn=<MseLossBackward0>)
tensor(8.8620, grad_fn=<MseLossBackward0>)
tensor(8.8600, grad_fn=<MseLossBackward0>)
tensor(80.6031, grad_fn=<MseLossBackward0>)
tensor(48.6959, grad_fn=<MseLossBackward0>)
tensor(63.6432, grad_fn=<MseLossBackward0>)
tensor(3.9065, grad_fn=<MseLossBackward0>)
tensor(24.7298, grad_fn=<MseLossBackward0>)

tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(48.7464, grad_fn=<MseLossBackward0>)
tensor(8.8918, grad_fn=<MseLossBackward0>)
tensor(24.7582, grad_fn=<MseLossBackward0>)
tensor(0.9617, grad_fn=<MseLossBackward0>)
tensor(63.5932, grad_fn=<MseLossBackward0>)
tensor(8.8392, grad_fn=<MseLossBackward0>)
tensor(0.0087, grad_fn=<MseLossBackward0>)
tensor(24.7569, grad_fn=<MseLossBackward0>)
tensor(3.9055, grad_fn=<MseLossBackward0>)
tensor(63.6343, grad_fn=<MseLossBackward0>)
tensor(63.6536, grad_fn=<MseLossBackward0>)
tensor(8.8411, grad_fn=<MseLossBackward0>)
tensor(80.6108, grad_fn=<MseLossBackward0>)
tensor(35.6792, grad_fn=<MseLossBackward0>)
tensor(0.0070, grad_fn=<MseLossBackward0>)
tensor(8.8085, grad_fn=<MseLossBackward0>)
tensor(24.7783, grad_fn=<MseLossBackward0>)
tensor(8.8738, grad_fn=<MseLossBackward0>)
tensor(15.8155, grad_fn=<MseLossBackward0>)
tensor(0.9499, grad_fn=<MseLossBackward0>)
tensor(24.7688, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)


tensor(35.7089, grad_fn=<MseLossBackward0>)
tensor(63.6161, grad_fn=<MseLossBackward0>)
tensor(15.7845, grad_fn=<MseLossBackward0>)
tensor(15.7835, grad_fn=<MseLossBackward0>)
tensor(24.7713, grad_fn=<MseLossBackward0>)
tensor(48.6697, grad_fn=<MseLossBackward0>)
tensor(8.8768, grad_fn=<MseLossBackward0>)
tensor(15.8158, grad_fn=<MseLossBackward0>)
tensor(48.6734, grad_fn=<MseLossBackward0>)
tensor(48.6696, grad_fn=<MseLossBackward0>)
tensor(8.8455, grad_fn=<MseLossBackward0>)
tensor(35.6874, grad_fn=<MseLossBackward0>)
tensor(0.0088, grad_fn=<MseLossBackward0>)
tensor(48.6553, grad_fn=<MseLossBackward0>)
tensor(3.9076, grad_fn=<MseLossBackward0>)
tensor(35.6883, grad_fn=<MseLossBackward0>)
tensor(48.5948, grad_fn=<MseLossBackward0>)
tensor(15.8065, grad_fn=<MseLossBackward0>)
tensor(0.9586, grad_fn=<MseLossBackward0>)
tensor(63.6710, grad_fn=<MseLossBackward0>)
tensor(0.0069, grad_fn=<MseLossBackward0>)
tensor(3.9078, grad_fn=<MseLossBackward0>)
tensor(3.9029, grad_fn=<MseLossBackward

tensor(63.6556, grad_fn=<MseLossBackward0>)
tensor(8.8492, grad_fn=<MseLossBackward0>)
tensor(63.6390, grad_fn=<MseLossBackward0>)
tensor(15.7980, grad_fn=<MseLossBackward0>)
tensor(48.6269, grad_fn=<MseLossBackward0>)
tensor(24.7894, grad_fn=<MseLossBackward0>)
tensor(48.6815, grad_fn=<MseLossBackward0>)
tensor(24.7532, grad_fn=<MseLossBackward0>)
tensor(8.8547, grad_fn=<MseLossBackward0>)
tensor(0.9662, grad_fn=<MseLossBackward0>)
tensor(3.8980, grad_fn=<MseLossBackward0>)
tensor(35.7020, grad_fn=<MseLossBackward0>)
tensor(0.9504, grad_fn=<MseLossBackward0>)
tensor(8.8432, grad_fn=<MseLossBackward0>)
tensor(3.9192, grad_fn=<MseLossBackward0>)
tensor(0.0080, grad_fn=<MseLossBackward0>)
tensor(48.6049, grad_fn=<MseLossBackward0>)
tensor(24.7537, grad_fn=<MseLossBackward0>)
tensor(0.0068, grad_fn=<MseLossBackward0>)
tensor(0.0092, grad_fn=<MseLossBackward0>)
tensor(0.0081, grad_fn=<MseLossBackward0>)
tensor(0.9508, grad_fn=<MseLossBackward0>)
tensor(15.7982, grad_fn=<MseLossBackward0>)


tensor(15.7974, grad_fn=<MseLossBackward0>)
tensor(15.7976, grad_fn=<MseLossBackward0>)
tensor(80.4724, grad_fn=<MseLossBackward0>)
tensor(15.7948, grad_fn=<MseLossBackward0>)
tensor(63.5808, grad_fn=<MseLossBackward0>)
tensor(3.9013, grad_fn=<MseLossBackward0>)
tensor(35.6942, grad_fn=<MseLossBackward0>)
tensor(35.6563, grad_fn=<MseLossBackward0>)
tensor(0.9612, grad_fn=<MseLossBackward0>)
tensor(35.7016, grad_fn=<MseLossBackward0>)
tensor(8.8578, grad_fn=<MseLossBackward0>)
tensor(35.7159, grad_fn=<MseLossBackward0>)
tensor(24.7818, grad_fn=<MseLossBackward0>)
tensor(63.6083, grad_fn=<MseLossBackward0>)
tensor(15.7981, grad_fn=<MseLossBackward0>)
tensor(35.7087, grad_fn=<MseLossBackward0>)
tensor(48.6516, grad_fn=<MseLossBackward0>)
tensor(0.9502, grad_fn=<MseLossBackward0>)
tensor(80.6218, grad_fn=<MseLossBackward0>)
tensor(8.8323, grad_fn=<MseLossBackward0>)
tensor(35.7099, grad_fn=<MseLossBackward0>)
tensor(48.6423, grad_fn=<MseLossBackward0>)
tensor(35.7250, grad_fn=<MseLossBackw

tensor(0.9591, grad_fn=<MseLossBackward0>)
tensor(24.7307, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(80.5891, grad_fn=<MseLossBackward0>)
tensor(63.6057, grad_fn=<MseLossBackward0>)
tensor(35.6754, grad_fn=<MseLossBackward0>)
tensor(8.8409, grad_fn=<MseLossBackward0>)
tensor(35.6932, grad_fn=<MseLossBackward0>)
tensor(8.8226, grad_fn=<MseLossBackward0>)
tensor(15.7454, grad_fn=<MseLossBackward0>)
tensor(15.7953, grad_fn=<MseLossBackward0>)
tensor(48.6600, grad_fn=<MseLossBackward0>)
tensor(15.7937, grad_fn=<MseLossBackward0>)
tensor(48.6046, grad_fn=<MseLossBackward0>)
tensor(15.7836, grad_fn=<MseLossBackward0>)
tensor(8.8272, grad_fn=<MseLossBackward0>)
tensor(3.9161, grad_fn=<MseLossBackward0>)
tensor(15.8230, grad_fn=<MseLossBackward0>)
tensor(24.6986, grad_fn=<MseLossBackward0>)
tensor(24.7565, grad_fn=<MseLossBackward0>)
tensor(48.5892, grad_fn=<MseLossBackward0>)
tensor(24.8045, grad_fn=<MseLossBackward0>)
tensor(15.7715, grad_fn=<MseLossBackwa

tensor(24.7489, grad_fn=<MseLossBackward0>)
tensor(8.8559, grad_fn=<MseLossBackward0>)
tensor(63.5946, grad_fn=<MseLossBackward0>)
tensor(3.8873, grad_fn=<MseLossBackward0>)
tensor(15.7804, grad_fn=<MseLossBackward0>)
tensor(3.8974, grad_fn=<MseLossBackward0>)
tensor(3.9006, grad_fn=<MseLossBackward0>)
tensor(35.6724, grad_fn=<MseLossBackward0>)
tensor(48.6333, grad_fn=<MseLossBackward0>)
tensor(35.7143, grad_fn=<MseLossBackward0>)
tensor(0.0083, grad_fn=<MseLossBackward0>)
tensor(24.7313, grad_fn=<MseLossBackward0>)
tensor(24.7866, grad_fn=<MseLossBackward0>)
tensor(63.4871, grad_fn=<MseLossBackward0>)
tensor(15.8066, grad_fn=<MseLossBackward0>)
tensor(24.7502, grad_fn=<MseLossBackward0>)
tensor(35.6885, grad_fn=<MseLossBackward0>)
tensor(0.9578, grad_fn=<MseLossBackward0>)
tensor(8.8462, grad_fn=<MseLossBackward0>)
tensor(24.6692, grad_fn=<MseLossBackward0>)
tensor(15.7794, grad_fn=<MseLossBackward0>)
tensor(48.5812, grad_fn=<MseLossBackward0>)
tensor(8.8725, grad_fn=<MseLossBackward

tensor(15.7912, grad_fn=<MseLossBackward0>)
tensor(63.6655, grad_fn=<MseLossBackward0>)
tensor(15.7911, grad_fn=<MseLossBackward0>)
tensor(8.8454, grad_fn=<MseLossBackward0>)
tensor(0.0077, grad_fn=<MseLossBackward0>)
tensor(15.7832, grad_fn=<MseLossBackward0>)
tensor(0.0066, grad_fn=<MseLossBackward0>)
tensor(0.9555, grad_fn=<MseLossBackward0>)
tensor(80.5342, grad_fn=<MseLossBackward0>)
tensor(8.8697, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(8.8539, grad_fn=<MseLossBackward0>)
tensor(35.7035, grad_fn=<MseLossBackward0>)
tensor(24.7495, grad_fn=<MseLossBackward0>)
tensor(24.7322, grad_fn=<MseLossBackward0>)
tensor(3.8992, grad_fn=<MseLossBackward0>)
tensor(63.6065, grad_fn=<MseLossBackward0>)
tensor(24.6858, grad_fn=<MseLossBackward0>)
tensor(0.0071, grad_fn=<MseLossBackward0>)
tensor(63.6831, grad_fn=<MseLossBackward0>)
tensor(48.6280, grad_fn=<MseLossBackward0>)
tensor(24.7588, grad_fn=<MseLossBackward0>)
tensor(3.8996, grad_fn=<MseLossBackward0>

tensor(63.6063, grad_fn=<MseLossBackward0>)
tensor(3.8956, grad_fn=<MseLossBackward0>)
tensor(35.6979, grad_fn=<MseLossBackward0>)
tensor(15.7802, grad_fn=<MseLossBackward0>)
tensor(48.6252, grad_fn=<MseLossBackward0>)
tensor(80.5296, grad_fn=<MseLossBackward0>)
tensor(24.7900, grad_fn=<MseLossBackward0>)
tensor(48.6198, grad_fn=<MseLossBackward0>)
tensor(3.9064, grad_fn=<MseLossBackward0>)
tensor(35.6724, grad_fn=<MseLossBackward0>)
tensor(3.9133, grad_fn=<MseLossBackward0>)
tensor(0.9618, grad_fn=<MseLossBackward0>)
tensor(80.5204, grad_fn=<MseLossBackward0>)
tensor(80.5697, grad_fn=<MseLossBackward0>)
tensor(48.6565, grad_fn=<MseLossBackward0>)
tensor(3.8987, grad_fn=<MseLossBackward0>)
tensor(24.7475, grad_fn=<MseLossBackward0>)
tensor(0.9705, grad_fn=<MseLossBackward0>)
tensor(63.6403, grad_fn=<MseLossBackward0>)
tensor(0.9632, grad_fn=<MseLossBackward0>)
tensor(35.7147, grad_fn=<MseLossBackward0>)
tensor(8.8329, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0

tensor(15.7784, grad_fn=<MseLossBackward0>)
tensor(63.6418, grad_fn=<MseLossBackward0>)
tensor(15.7858, grad_fn=<MseLossBackward0>)
tensor(35.6975, grad_fn=<MseLossBackward0>)
tensor(3.9015, grad_fn=<MseLossBackward0>)
tensor(3.9009, grad_fn=<MseLossBackward0>)
tensor(3.9102, grad_fn=<MseLossBackward0>)
tensor(35.6566, grad_fn=<MseLossBackward0>)
tensor(8.8637, grad_fn=<MseLossBackward0>)
tensor(15.7873, grad_fn=<MseLossBackward0>)
tensor(0.0087, grad_fn=<MseLossBackward0>)
tensor(63.6355, grad_fn=<MseLossBackward0>)
tensor(0.9491, grad_fn=<MseLossBackward0>)
tensor(8.8691, grad_fn=<MseLossBackward0>)
tensor(63.5583, grad_fn=<MseLossBackward0>)
tensor(8.8361, grad_fn=<MseLossBackward0>)
tensor(63.6319, grad_fn=<MseLossBackward0>)
tensor(80.5829, grad_fn=<MseLossBackward0>)
tensor(0.9509, grad_fn=<MseLossBackward0>)
tensor(35.7375, grad_fn=<MseLossBackward0>)
tensor(0.9497, grad_fn=<MseLossBackward0>)
tensor(80.5329, grad_fn=<MseLossBackward0>)
tensor(63.6168, grad_fn=<MseLossBackward0>

tensor(80.6307, grad_fn=<MseLossBackward0>)
tensor(0.9558, grad_fn=<MseLossBackward0>)
tensor(0.0077, grad_fn=<MseLossBackward0>)
tensor(35.7293, grad_fn=<MseLossBackward0>)
tensor(24.7285, grad_fn=<MseLossBackward0>)
tensor(8.8644, grad_fn=<MseLossBackward0>)
tensor(0.0068, grad_fn=<MseLossBackward0>)
tensor(80.5736, grad_fn=<MseLossBackward0>)
tensor(0.0077, grad_fn=<MseLossBackward0>)
tensor(35.6729, grad_fn=<MseLossBackward0>)
tensor(3.8810, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(15.8010, grad_fn=<MseLossBackward0>)
tensor(0.9584, grad_fn=<MseLossBackward0>)
tensor(35.7118, grad_fn=<MseLossBackward0>)
tensor(48.6341, grad_fn=<MseLossBackward0>)
tensor(35.7121, grad_fn=<MseLossBackward0>)
tensor(0.9513, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(15.8153, grad_fn=<MseLossBackward0>)
tensor(35.7066, grad_fn=<MseLossBackward0>)
tensor(0.0092, grad_fn=<MseLossBackward0>)
tensor(15.7844, grad_fn=<MseLossBackward0>)

tensor(8.8807, grad_fn=<MseLossBackward0>)
tensor(0.9534, grad_fn=<MseLossBackward0>)
tensor(24.7380, grad_fn=<MseLossBackward0>)
tensor(15.8039, grad_fn=<MseLossBackward0>)
tensor(24.7463, grad_fn=<MseLossBackward0>)
tensor(0.9600, grad_fn=<MseLossBackward0>)
tensor(63.5765, grad_fn=<MseLossBackward0>)
tensor(80.5481, grad_fn=<MseLossBackward0>)
tensor(0.9498, grad_fn=<MseLossBackward0>)
tensor(8.8810, grad_fn=<MseLossBackward0>)
tensor(0.9594, grad_fn=<MseLossBackward0>)
tensor(48.6524, grad_fn=<MseLossBackward0>)
tensor(3.9105, grad_fn=<MseLossBackward0>)
tensor(80.5801, grad_fn=<MseLossBackward0>)
tensor(63.6620, grad_fn=<MseLossBackward0>)
tensor(80.5336, grad_fn=<MseLossBackward0>)
tensor(15.7771, grad_fn=<MseLossBackward0>)
tensor(35.6837, grad_fn=<MseLossBackward0>)
tensor(0.0092, grad_fn=<MseLossBackward0>)
tensor(80.4912, grad_fn=<MseLossBackward0>)
tensor(15.8095, grad_fn=<MseLossBackward0>)
tensor(0.0072, grad_fn=<MseLossBackward0>)
tensor(15.7885, grad_fn=<MseLossBackward0

tensor(0.9612, grad_fn=<MseLossBackward0>)
tensor(0.9565, grad_fn=<MseLossBackward0>)
tensor(3.8957, grad_fn=<MseLossBackward0>)
tensor(63.6314, grad_fn=<MseLossBackward0>)
tensor(3.8895, grad_fn=<MseLossBackward0>)
tensor(35.6912, grad_fn=<MseLossBackward0>)
tensor(80.6004, grad_fn=<MseLossBackward0>)
tensor(15.8026, grad_fn=<MseLossBackward0>)
tensor(63.6100, grad_fn=<MseLossBackward0>)
tensor(15.8105, grad_fn=<MseLossBackward0>)
tensor(15.8030, grad_fn=<MseLossBackward0>)
tensor(0.9682, grad_fn=<MseLossBackward0>)
tensor(24.7557, grad_fn=<MseLossBackward0>)
tensor(3.9036, grad_fn=<MseLossBackward0>)
tensor(35.7058, grad_fn=<MseLossBackward0>)
tensor(80.5100, grad_fn=<MseLossBackward0>)
tensor(3.8922, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(48.6246, grad_fn=<MseLossBackward0>)
tensor(0.9688, grad_fn=<MseLossBackward0>)
tensor(63.5896, grad_fn=<MseLossBackward0>)
tensor(80.4626, grad_fn=<MseLossBackward0>)
tensor(8.8745, grad_fn=<MseLossBackward0>

tensor(0.9600, grad_fn=<MseLossBackward0>)
tensor(24.7733, grad_fn=<MseLossBackward0>)
tensor(15.8085, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(63.5660, grad_fn=<MseLossBackward0>)
tensor(15.8061, grad_fn=<MseLossBackward0>)
tensor(80.5148, grad_fn=<MseLossBackward0>)
tensor(63.6072, grad_fn=<MseLossBackward0>)
tensor(48.6290, grad_fn=<MseLossBackward0>)
tensor(63.6870, grad_fn=<MseLossBackward0>)
tensor(15.7960, grad_fn=<MseLossBackward0>)
tensor(3.9021, grad_fn=<MseLossBackward0>)
tensor(8.8615, grad_fn=<MseLossBackward0>)
tensor(15.8144, grad_fn=<MseLossBackward0>)
tensor(0.0063, grad_fn=<MseLossBackward0>)
tensor(24.8040, grad_fn=<MseLossBackward0>)
tensor(15.8030, grad_fn=<MseLossBackward0>)
tensor(0.9625, grad_fn=<MseLossBackward0>)
tensor(63.6380, grad_fn=<MseLossBackward0>)
tensor(3.8996, grad_fn=<MseLossBackward0>)
tensor(24.7556, grad_fn=<MseLossBackward0>)
tensor(15.8043, grad_fn=<MseLossBackward0>)
tensor(24.7483, grad_fn=<MseLossBackwar

tensor(0.0073, grad_fn=<MseLossBackward0>)
tensor(8.8243, grad_fn=<MseLossBackward0>)
tensor(24.7933, grad_fn=<MseLossBackward0>)
tensor(24.7286, grad_fn=<MseLossBackward0>)
tensor(8.8533, grad_fn=<MseLossBackward0>)
tensor(63.5689, grad_fn=<MseLossBackward0>)
tensor(48.5935, grad_fn=<MseLossBackward0>)
tensor(48.6348, grad_fn=<MseLossBackward0>)
tensor(80.5215, grad_fn=<MseLossBackward0>)
tensor(35.7248, grad_fn=<MseLossBackward0>)
tensor(24.7492, grad_fn=<MseLossBackward0>)
tensor(63.6289, grad_fn=<MseLossBackward0>)
tensor(80.4727, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(0.9649, grad_fn=<MseLossBackward0>)
tensor(80.6531, grad_fn=<MseLossBackward0>)
tensor(15.7940, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(0.0072, grad_fn=<MseLossBackward0>)
tensor(0.9524, grad_fn=<MseLossBackward0>)
tensor(48.6236, grad_fn=<MseLossBackward0>)
tensor(3.9060, grad_fn=<MseLossBackward0>)
tensor(3.9184, grad_fn=<MseLossBackward0>

tensor(0.9574, grad_fn=<MseLossBackward0>)
tensor(8.8482, grad_fn=<MseLossBackward0>)
tensor(15.7765, grad_fn=<MseLossBackward0>)
tensor(35.6523, grad_fn=<MseLossBackward0>)
tensor(80.5658, grad_fn=<MseLossBackward0>)
tensor(0.9608, grad_fn=<MseLossBackward0>)
tensor(0.0076, grad_fn=<MseLossBackward0>)
tensor(48.5865, grad_fn=<MseLossBackward0>)
tensor(0.9595, grad_fn=<MseLossBackward0>)
tensor(80.5225, grad_fn=<MseLossBackward0>)
tensor(24.7629, grad_fn=<MseLossBackward0>)
tensor(63.5430, grad_fn=<MseLossBackward0>)
tensor(0.9561, grad_fn=<MseLossBackward0>)
tensor(80.5655, grad_fn=<MseLossBackward0>)
tensor(80.5311, grad_fn=<MseLossBackward0>)
tensor(48.7416, grad_fn=<MseLossBackward0>)
tensor(80.5733, grad_fn=<MseLossBackward0>)
tensor(63.6147, grad_fn=<MseLossBackward0>)
tensor(8.8284, grad_fn=<MseLossBackward0>)
tensor(0.0086, grad_fn=<MseLossBackward0>)
tensor(3.8933, grad_fn=<MseLossBackward0>)
tensor(35.7302, grad_fn=<MseLossBackward0>)
tensor(0.0085, grad_fn=<MseLossBackward0>

tensor(0.9508, grad_fn=<MseLossBackward0>)
tensor(24.8110, grad_fn=<MseLossBackward0>)
tensor(3.9163, grad_fn=<MseLossBackward0>)
tensor(3.9073, grad_fn=<MseLossBackward0>)
tensor(48.6199, grad_fn=<MseLossBackward0>)
tensor(80.6070, grad_fn=<MseLossBackward0>)
tensor(8.8532, grad_fn=<MseLossBackward0>)
tensor(80.5226, grad_fn=<MseLossBackward0>)
tensor(8.8535, grad_fn=<MseLossBackward0>)
tensor(24.7838, grad_fn=<MseLossBackward0>)
tensor(3.9152, grad_fn=<MseLossBackward0>)
tensor(3.9108, grad_fn=<MseLossBackward0>)
tensor(3.9021, grad_fn=<MseLossBackward0>)
tensor(63.6453, grad_fn=<MseLossBackward0>)
tensor(63.5341, grad_fn=<MseLossBackward0>)
tensor(24.7990, grad_fn=<MseLossBackward0>)
tensor(0.0099, grad_fn=<MseLossBackward0>)
tensor(0.0089, grad_fn=<MseLossBackward0>)
tensor(48.6464, grad_fn=<MseLossBackward0>)
tensor(0.0086, grad_fn=<MseLossBackward0>)
tensor(8.8409, grad_fn=<MseLossBackward0>)
tensor(0.9552, grad_fn=<MseLossBackward0>)
tensor(35.6490, grad_fn=<MseLossBackward0>)
t

tensor(63.5777, grad_fn=<MseLossBackward0>)
tensor(3.9116, grad_fn=<MseLossBackward0>)
tensor(63.6069, grad_fn=<MseLossBackward0>)
tensor(15.8033, grad_fn=<MseLossBackward0>)
tensor(0.0081, grad_fn=<MseLossBackward0>)
tensor(63.5248, grad_fn=<MseLossBackward0>)
tensor(8.8501, grad_fn=<MseLossBackward0>)
tensor(35.6525, grad_fn=<MseLossBackward0>)
tensor(0.9570, grad_fn=<MseLossBackward0>)
tensor(3.9020, grad_fn=<MseLossBackward0>)
tensor(8.8507, grad_fn=<MseLossBackward0>)
tensor(0.0082, grad_fn=<MseLossBackward0>)
tensor(24.7498, grad_fn=<MseLossBackward0>)
tensor(0.0083, grad_fn=<MseLossBackward0>)
tensor(15.7989, grad_fn=<MseLossBackward0>)
tensor(0.9529, grad_fn=<MseLossBackward0>)
tensor(48.6082, grad_fn=<MseLossBackward0>)
tensor(3.8950, grad_fn=<MseLossBackward0>)
tensor(0.0069, grad_fn=<MseLossBackward0>)
tensor(0.9494, grad_fn=<MseLossBackward0>)
tensor(8.8481, grad_fn=<MseLossBackward0>)
tensor(80.5622, grad_fn=<MseLossBackward0>)
tensor(0.9557, grad_fn=<MseLossBackward0>)
te

tensor(80.5470, grad_fn=<MseLossBackward0>)
tensor(8.8187, grad_fn=<MseLossBackward0>)
tensor(35.6757, grad_fn=<MseLossBackward0>)
tensor(48.6701, grad_fn=<MseLossBackward0>)
tensor(0.9566, grad_fn=<MseLossBackward0>)
tensor(63.6338, grad_fn=<MseLossBackward0>)
tensor(8.8397, grad_fn=<MseLossBackward0>)
tensor(80.4964, grad_fn=<MseLossBackward0>)
tensor(63.6036, grad_fn=<MseLossBackward0>)
tensor(48.6394, grad_fn=<MseLossBackward0>)
tensor(63.6907, grad_fn=<MseLossBackward0>)
tensor(63.6068, grad_fn=<MseLossBackward0>)
tensor(0.0091, grad_fn=<MseLossBackward0>)
tensor(8.8355, grad_fn=<MseLossBackward0>)
tensor(3.9153, grad_fn=<MseLossBackward0>)
tensor(15.7911, grad_fn=<MseLossBackward0>)
tensor(63.6269, grad_fn=<MseLossBackward0>)
tensor(48.6033, grad_fn=<MseLossBackward0>)
tensor(24.7528, grad_fn=<MseLossBackward0>)
tensor(48.5982, grad_fn=<MseLossBackward0>)
tensor(0.9566, grad_fn=<MseLossBackward0>)
tensor(63.5774, grad_fn=<MseLossBackward0>)
tensor(48.5428, grad_fn=<MseLossBackwar

tensor(35.6610, grad_fn=<MseLossBackward0>)
tensor(0.9534, grad_fn=<MseLossBackward0>)
tensor(63.6746, grad_fn=<MseLossBackward0>)
tensor(48.6353, grad_fn=<MseLossBackward0>)
tensor(8.8618, grad_fn=<MseLossBackward0>)
tensor(3.9447, grad_fn=<MseLossBackward0>)
tensor(3.9038, grad_fn=<MseLossBackward0>)
tensor(35.6665, grad_fn=<MseLossBackward0>)
tensor(24.7913, grad_fn=<MseLossBackward0>)
tensor(35.6802, grad_fn=<MseLossBackward0>)
tensor(80.6293, grad_fn=<MseLossBackward0>)
tensor(3.9018, grad_fn=<MseLossBackward0>)
tensor(24.7355, grad_fn=<MseLossBackward0>)
tensor(15.8427, grad_fn=<MseLossBackward0>)
tensor(80.5916, grad_fn=<MseLossBackward0>)
tensor(63.5786, grad_fn=<MseLossBackward0>)
tensor(24.7129, grad_fn=<MseLossBackward0>)
tensor(8.8372, grad_fn=<MseLossBackward0>)
tensor(80.5620, grad_fn=<MseLossBackward0>)
tensor(8.8687, grad_fn=<MseLossBackward0>)
tensor(24.7934, grad_fn=<MseLossBackward0>)
tensor(48.6081, grad_fn=<MseLossBackward0>)
tensor(0.9635, grad_fn=<MseLossBackward

tensor(35.6549, grad_fn=<MseLossBackward0>)
tensor(35.7102, grad_fn=<MseLossBackward0>)
tensor(15.7899, grad_fn=<MseLossBackward0>)
tensor(0.0081, grad_fn=<MseLossBackward0>)
tensor(48.6544, grad_fn=<MseLossBackward0>)
tensor(0.9497, grad_fn=<MseLossBackward0>)
tensor(48.5948, grad_fn=<MseLossBackward0>)
tensor(8.8443, grad_fn=<MseLossBackward0>)
tensor(0.0071, grad_fn=<MseLossBackward0>)
tensor(63.5728, grad_fn=<MseLossBackward0>)
tensor(0.9647, grad_fn=<MseLossBackward0>)
tensor(3.9040, grad_fn=<MseLossBackward0>)
tensor(15.7873, grad_fn=<MseLossBackward0>)
tensor(0.9502, grad_fn=<MseLossBackward0>)
tensor(3.9257, grad_fn=<MseLossBackward0>)
tensor(3.9176, grad_fn=<MseLossBackward0>)
tensor(15.7765, grad_fn=<MseLossBackward0>)
tensor(80.6224, grad_fn=<MseLossBackward0>)
tensor(63.6498, grad_fn=<MseLossBackward0>)
tensor(3.8968, grad_fn=<MseLossBackward0>)
tensor(63.6196, grad_fn=<MseLossBackward0>)
tensor(48.6639, grad_fn=<MseLossBackward0>)
tensor(35.7384, grad_fn=<MseLossBackward0>

tensor(80.5015, grad_fn=<MseLossBackward0>)
tensor(35.7198, grad_fn=<MseLossBackward0>)
tensor(35.7418, grad_fn=<MseLossBackward0>)
tensor(35.6918, grad_fn=<MseLossBackward0>)
tensor(63.6229, grad_fn=<MseLossBackward0>)
tensor(48.6392, grad_fn=<MseLossBackward0>)
tensor(15.7899, grad_fn=<MseLossBackward0>)
tensor(0.9528, grad_fn=<MseLossBackward0>)
tensor(63.6474, grad_fn=<MseLossBackward0>)
tensor(0.9723, grad_fn=<MseLossBackward0>)
tensor(3.8943, grad_fn=<MseLossBackward0>)
tensor(3.9042, grad_fn=<MseLossBackward0>)
tensor(15.7974, grad_fn=<MseLossBackward0>)
tensor(63.6436, grad_fn=<MseLossBackward0>)
tensor(24.6900, grad_fn=<MseLossBackward0>)
tensor(3.9022, grad_fn=<MseLossBackward0>)
tensor(35.7284, grad_fn=<MseLossBackward0>)
tensor(24.7312, grad_fn=<MseLossBackward0>)
tensor(8.8492, grad_fn=<MseLossBackward0>)
tensor(80.4496, grad_fn=<MseLossBackward0>)
tensor(0.9476, grad_fn=<MseLossBackward0>)
tensor(0.0093, grad_fn=<MseLossBackward0>)
tensor(48.6123, grad_fn=<MseLossBackward

tensor(63.5691, grad_fn=<MseLossBackward0>)
tensor(80.4869, grad_fn=<MseLossBackward0>)
tensor(48.6085, grad_fn=<MseLossBackward0>)
tensor(0.0089, grad_fn=<MseLossBackward0>)
tensor(8.8497, grad_fn=<MseLossBackward0>)
tensor(63.5362, grad_fn=<MseLossBackward0>)
tensor(0.0078, grad_fn=<MseLossBackward0>)
tensor(24.7823, grad_fn=<MseLossBackward0>)
tensor(80.6519, grad_fn=<MseLossBackward0>)
tensor(24.7552, grad_fn=<MseLossBackward0>)
tensor(63.5972, grad_fn=<MseLossBackward0>)
tensor(15.7904, grad_fn=<MseLossBackward0>)
tensor(3.9051, grad_fn=<MseLossBackward0>)
tensor(0.0068, grad_fn=<MseLossBackward0>)
tensor(80.5375, grad_fn=<MseLossBackward0>)
tensor(3.9164, grad_fn=<MseLossBackward0>)
tensor(3.8971, grad_fn=<MseLossBackward0>)
tensor(15.7995, grad_fn=<MseLossBackward0>)
tensor(15.7757, grad_fn=<MseLossBackward0>)
tensor(80.6479, grad_fn=<MseLossBackward0>)
tensor(3.8962, grad_fn=<MseLossBackward0>)
tensor(3.8913, grad_fn=<MseLossBackward0>)
tensor(3.9080, grad_fn=<MseLossBackward0>

tensor(80.5157, grad_fn=<MseLossBackward0>)
tensor(24.7618, grad_fn=<MseLossBackward0>)
tensor(35.6649, grad_fn=<MseLossBackward0>)
tensor(80.5651, grad_fn=<MseLossBackward0>)
tensor(8.8481, grad_fn=<MseLossBackward0>)
tensor(80.5206, grad_fn=<MseLossBackward0>)
tensor(63.5818, grad_fn=<MseLossBackward0>)
tensor(48.6083, grad_fn=<MseLossBackward0>)
tensor(48.6811, grad_fn=<MseLossBackward0>)
tensor(0.9606, grad_fn=<MseLossBackward0>)
tensor(35.7306, grad_fn=<MseLossBackward0>)
tensor(24.7414, grad_fn=<MseLossBackward0>)
tensor(8.8468, grad_fn=<MseLossBackward0>)
tensor(0.9589, grad_fn=<MseLossBackward0>)
tensor(8.8692, grad_fn=<MseLossBackward0>)
tensor(0.9524, grad_fn=<MseLossBackward0>)
tensor(3.9025, grad_fn=<MseLossBackward0>)
tensor(48.6292, grad_fn=<MseLossBackward0>)
tensor(0.9542, grad_fn=<MseLossBackward0>)
tensor(63.6013, grad_fn=<MseLossBackward0>)
tensor(3.9097, grad_fn=<MseLossBackward0>)
tensor(0.0083, grad_fn=<MseLossBackward0>)
tensor(80.5774, grad_fn=<MseLossBackward0>

tensor(24.7645, grad_fn=<MseLossBackward0>)
tensor(48.6663, grad_fn=<MseLossBackward0>)
tensor(63.6590, grad_fn=<MseLossBackward0>)
tensor(0.0071, grad_fn=<MseLossBackward0>)
tensor(24.7267, grad_fn=<MseLossBackward0>)
tensor(0.0075, grad_fn=<MseLossBackward0>)
tensor(48.5885, grad_fn=<MseLossBackward0>)
tensor(15.8350, grad_fn=<MseLossBackward0>)
tensor(63.5923, grad_fn=<MseLossBackward0>)
tensor(3.8815, grad_fn=<MseLossBackward0>)
tensor(24.6916, grad_fn=<MseLossBackward0>)
tensor(0.9548, grad_fn=<MseLossBackward0>)
tensor(8.8617, grad_fn=<MseLossBackward0>)
tensor(3.9028, grad_fn=<MseLossBackward0>)
tensor(3.9189, grad_fn=<MseLossBackward0>)
tensor(35.6972, grad_fn=<MseLossBackward0>)
tensor(3.9038, grad_fn=<MseLossBackward0>)
tensor(0.9509, grad_fn=<MseLossBackward0>)
tensor(48.6582, grad_fn=<MseLossBackward0>)
tensor(15.7775, grad_fn=<MseLossBackward0>)
tensor(35.7114, grad_fn=<MseLossBackward0>)
tensor(8.8254, grad_fn=<MseLossBackward0>)
tensor(0.9543, grad_fn=<MseLossBackward0>)

tensor(80.5473, grad_fn=<MseLossBackward0>)
tensor(0.9532, grad_fn=<MseLossBackward0>)
tensor(35.6661, grad_fn=<MseLossBackward0>)
tensor(48.6562, grad_fn=<MseLossBackward0>)
tensor(3.8904, grad_fn=<MseLossBackward0>)
tensor(0.0092, grad_fn=<MseLossBackward0>)
tensor(0.9591, grad_fn=<MseLossBackward0>)
tensor(48.7001, grad_fn=<MseLossBackward0>)
tensor(35.6960, grad_fn=<MseLossBackward0>)
tensor(24.7373, grad_fn=<MseLossBackward0>)
tensor(3.8852, grad_fn=<MseLossBackward0>)
tensor(3.9020, grad_fn=<MseLossBackward0>)
tensor(24.7095, grad_fn=<MseLossBackward0>)
tensor(35.7226, grad_fn=<MseLossBackward0>)
tensor(0.0074, grad_fn=<MseLossBackward0>)
tensor(80.5278, grad_fn=<MseLossBackward0>)
tensor(0.0074, grad_fn=<MseLossBackward0>)
tensor(0.9499, grad_fn=<MseLossBackward0>)
tensor(24.7429, grad_fn=<MseLossBackward0>)
tensor(8.8234, grad_fn=<MseLossBackward0>)
tensor(8.8421, grad_fn=<MseLossBackward0>)
tensor(24.7897, grad_fn=<MseLossBackward0>)
tensor(63.6429, grad_fn=<MseLossBackward0>)

tensor(0.0068, grad_fn=<MseLossBackward0>)
tensor(24.7732, grad_fn=<MseLossBackward0>)
tensor(0.9723, grad_fn=<MseLossBackward0>)
tensor(3.9028, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(15.8162, grad_fn=<MseLossBackward0>)
tensor(80.7076, grad_fn=<MseLossBackward0>)
tensor(24.7035, grad_fn=<MseLossBackward0>)
tensor(0.9549, grad_fn=<MseLossBackward0>)
tensor(3.9023, grad_fn=<MseLossBackward0>)
tensor(3.8873, grad_fn=<MseLossBackward0>)
tensor(48.6366, grad_fn=<MseLossBackward0>)
tensor(63.5600, grad_fn=<MseLossBackward0>)
tensor(48.6679, grad_fn=<MseLossBackward0>)
tensor(3.9087, grad_fn=<MseLossBackward0>)
tensor(15.7830, grad_fn=<MseLossBackward0>)
tensor(24.7488, grad_fn=<MseLossBackward0>)
tensor(8.8602, grad_fn=<MseLossBackward0>)
tensor(15.7566, grad_fn=<MseLossBackward0>)
tensor(0.0079, grad_fn=<MseLossBackward0>)
tensor(35.6611, grad_fn=<MseLossBackward0>)
tensor(0.9604, grad_fn=<MseLossBackward0>)
tensor(24.7601, grad_fn=<MseLossBackward0>)

## 优化器与反向传播 

In [46]:
# 设置优化器
optim = torch.optim.SGD(model.parameters(),lr=0.01) # lr:学习速率

# 设置损失函数
loss = torch.nn.CrossEntropyLoss()

In [47]:
for epoch in range(20):        # 20轮学习
    running_loss = 0.0
    for data in dataloader:
        imgs,targets = data
        outputs = model(imgs)
        result_loss = loss(outputs,targets)
        optim.zero_grad()      # 归零设置
        result_loss.backward() # 计算参数结点梯度，反向传播
        optim.step()           # 对模型参数调优
        running_loss = running_loss + result_loss
    print(running_loss)

tensor(18724.4316, grad_fn=<AddBackward0>)
tensor(16168.3994, grad_fn=<AddBackward0>)
tensor(15496.1885, grad_fn=<AddBackward0>)
tensor(16028.2285, grad_fn=<AddBackward0>)
tensor(17854.3359, grad_fn=<AddBackward0>)
tensor(20226.9043, grad_fn=<AddBackward0>)
tensor(22024.8867, grad_fn=<AddBackward0>)
tensor(23296.9961, grad_fn=<AddBackward0>)
tensor(24412.8105, grad_fn=<AddBackward0>)
tensor(24831.4668, grad_fn=<AddBackward0>)
tensor(25119.8281, grad_fn=<AddBackward0>)
tensor(25933.5312, grad_fn=<AddBackward0>)
tensor(26550.5352, grad_fn=<AddBackward0>)
tensor(26990.6855, grad_fn=<AddBackward0>)
tensor(27693.2715, grad_fn=<AddBackward0>)
tensor(28878.5762, grad_fn=<AddBackward0>)
tensor(30447.3770, grad_fn=<AddBackward0>)
tensor(nan, grad_fn=<AddBackward0>)
tensor(nan, grad_fn=<AddBackward0>)
tensor(nan, grad_fn=<AddBackward0>)
