In [16]:
import torch
from torchvision.models import resnet18, ResNet18_Weights
# Load ResNet-18 with its default pretrained weights.
model = resnet18(weights=ResNet18_Weights.DEFAULT)
# A single random input of shape (1, 3, 64, 64) and a random target of
# shape (1, 1000); both are uniform noise, used only to drive one training step.
data = torch.rand((1, 3, 64, 64))
labels = torch.rand((1, 1000))

In [17]:
prediction = model(data) # forward pass: run the input through the model

In [18]:
# Reduce the element-wise difference between prediction and target to a
# single scalar, so backward() needs no explicit gradient argument.
loss = torch.sum(prediction - labels)
# Backward pass: autograd computes gradients of `loss` and stores them in
# the `.grad` attribute of the tensors that require gradients.
loss.backward()

In [19]:
# Create an SGD optimizer over all model parameters (learning rate 0.01,
# momentum 0.9).
# NOTE(review): a later cell runs `from torch import nn, optim`, which rebinds
# the name `optim` from this optimizer instance to the `torch.optim` module;
# re-running cells out of order therefore changes what `optim` refers to.
optim = torch.optim.SGD(model.parameters(), lr=1e-2, momentum=0.9)

In [20]:
optim.step() # gradient descent: update each parameter using its stored .grad

In [21]:
import torch

# Two leaf tensors that autograd should track; requires_grad_() flips the
# flag in place and returns the same tensor.
a = torch.tensor([2.0, 3.0]).requires_grad_()
b = torch.tensor([6.0, 4.0]).requires_grad_()

In [22]:
# Q = 3a^3 - b^2, computed element-wise from the two tracked tensors.
Q = 3 * a.pow(3) - b.pow(2)

In [23]:
# Q is a vector, so backward() needs an explicit gradient with Q's shape.
# A tensor of ones stands for dQ/dQ = 1 for every element.
external_grad = torch.ones_like(Q)
Q.backward(gradient=external_grad)

In [24]:
# Check that the collected gradients match the analytic derivatives:
# dQ/da = 9a^2 and dQ/db = -2b.
print(torch.eq(9 * a.pow(2), a.grad))
print(torch.eq(-2 * b, b.grad))

tensor([True, True])
tensor([True, True])


<!-- 방향성 비순환 그래프(DAG; Directed Acyclic Graph) -->

In [25]:
# Directed Acyclic Graph (DAG)

In [26]:
# x and y are plain random tensors; only z is tracked by autograd.
x = torch.rand((5, 5))
y = torch.rand((5, 5))
z = torch.rand(5, 5, requires_grad=True)

# A result requires gradients only if at least one of its inputs does.
a = torch.add(x, y)
print(f"Does `a` require gradients?: {a.requires_grad}")
b = torch.add(x, z)
print(f"Does `b` require gradients?: {b.requires_grad}")

Does `a` require gradients?: False
Does `b` require gradients?: True


In [27]:
from torch import nn, optim

# Start again from ResNet-18 with its default pretrained weights.
model = resnet18(weights=ResNet18_Weights.DEFAULT)

# Freeze every parameter of the network so autograd stops tracking them.
for param in model.parameters():
    param.requires_grad_(False)

In [28]:
# Replace the final fully connected layer with a new linear layer that has
# 10 outputs. Its parameters are freshly created, so they require gradients
# by default even though the rest of the network was frozen.
# The input width is read from the layer being replaced instead of
# hard-coding 512, so the cell keeps working if the backbone is swapped.
model.fc = nn.Linear(model.fc.in_features, 10)

In [29]:
# Optimize only the classifier: give the optimizer just the parameters that
# still require gradients rather than the frozen ones as well.
# `torch.optim.SGD` is spelled out in full because the bare name `optim` is
# also bound to an SGD instance in an earlier cell, which makes `optim.SGD`
# fragile when cells are re-run out of order.
trainable_params = [p for p in model.parameters() if p.requires_grad]
optimizer = torch.optim.SGD(trainable_params, lr=1e-2, momentum=0.9)