### 优化器，SGD，AdGrad，Adam等

In [1]:
import torch
import torchvision
from torch import nn
from torch.nn import Sequential, Conv2d, MaxPool2d, Flatten, Linear
from torch.optim.lr_scheduler import StepLR
from torch.utils.data import DataLoader

In [2]:
dataset = torchvision.datasets.CIFAR10("./dataset", train=False, transform=torchvision.transforms.ToTensor(),
                                       download=True)

Files already downloaded and verified


In [3]:
dataloader = DataLoader(dataset, batch_size=1)

In [4]:
class Tudui(nn.Module):
    def __init__(self):
        super(Tudui, self).__init__()
        self.model1 = Sequential(
            Conv2d(3, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 64, 5, padding=2),
            MaxPool2d(2),
            Flatten(),
            Linear(1024, 64),
            Linear(64, 10)
        )

    def forward(self, x):
        x = self.model1(x)
        return x

In [5]:
loss = nn.CrossEntropyLoss()

In [6]:
tudui = Tudui()

In [12]:
# 模型参数
tudui.parameters

<bound method Module.parameters of Tudui(
  (model1): Sequential(
    (0): Conv2d(3, 32, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (1): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
    (2): Conv2d(32, 32, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
    (4): Conv2d(32, 64, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (5): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
    (6): Flatten(start_dim=1, end_dim=-1)
    (7): Linear(in_features=1024, out_features=64, bias=True)
    (8): Linear(in_features=64, out_features=10, bias=True)
  )
)>

In [13]:
# 定义SGD优化器
optim = torch.optim.SGD(tudui.parameters(),lr=0.01)

In [14]:
for epoch in range(4):
    loss_sum = 0.0
    for data in dataloader:
        imgs,targets = data
        output = tudui.forward(imgs)
        # 计算出loss
        loss_epoch = loss(output,targets)
        # 优化器中梯度清0
        optim.zero_grad()
        # 反向传播求出每一次的梯度
        loss_epoch.backward()
        # 根据梯度更新参数
        optim.step()
        loss_sum = loss_sum + loss_epoch
    print(loss_sum)

tensor(16110.3340, grad_fn=<AddBackward0>)
tensor(15352.9795, grad_fn=<AddBackward0>)
tensor(15983.9580, grad_fn=<AddBackward0>)
tensor(18037.9023, grad_fn=<AddBackward0>)
