In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

torch.manual_seed(1)

# 훈련 데이터
x1_train = torch.FloatTensor([[73], [93], [89], [96], [73]])
x2_train = torch.FloatTensor([[80], [88], [91], [98], [66]])
x3_train = torch.FloatTensor([[75], [93], [90], [100], [70]])
y_train = torch.FloatTensor([[152], [185], [180], [196], [142]])

# 가중치 w와 편향 b 초기화
w1 = torch.zeros(1, requires_grad=True)
w2 = torch.zeros(1, requires_grad=True)
w3 = torch.zeros(1, requires_grad=True)
b = torch.zeros(1, requires_grad=True)


# optimizer 설정
optimizer = optim.SGD([w1, w2, w3, b], lr=1e-5)

nb_epochs = 1000
for epoch in range(nb_epochs + 1):

    # H(x) 계산
    hypothesis = x1_train * w1 + x2_train * w2 + x3_train * w3 + b

    # cost 계산
    cost = torch.mean((hypothesis - y_train) ** 2)

    # cost로 H(x) 개선
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    # 100번마다 로그 출력
    if epoch % 100 == 0:
        print('Epoch {:4d}/{} w1: {:.3f} w2: {:.3f} w3: {:.3f} b: {:.3f} Cost: {:.6f}'.format(
            epoch, nb_epochs, w1.item(), w2.item(), w3.item(), b.item(), cost.item()
        ))

Epoch    0/1000 w1: 0.294 w2: 0.294 w3: 0.297 b: 0.003 Cost: 29661.800781
Epoch  100/1000 w1: 0.674 w2: 0.661 w3: 0.676 b: 0.008 Cost: 1.563634
Epoch  200/1000 w1: 0.679 w2: 0.655 w3: 0.677 b: 0.008 Cost: 1.497607
Epoch  300/1000 w1: 0.684 w2: 0.649 w3: 0.677 b: 0.008 Cost: 1.435026
Epoch  400/1000 w1: 0.689 w2: 0.643 w3: 0.678 b: 0.008 Cost: 1.375730
Epoch  500/1000 w1: 0.694 w2: 0.638 w3: 0.678 b: 0.009 Cost: 1.319511
Epoch  600/1000 w1: 0.699 w2: 0.633 w3: 0.679 b: 0.009 Cost: 1.266222
Epoch  700/1000 w1: 0.704 w2: 0.627 w3: 0.679 b: 0.009 Cost: 1.215696
Epoch  800/1000 w1: 0.709 w2: 0.622 w3: 0.679 b: 0.009 Cost: 1.167818
Epoch  900/1000 w1: 0.713 w2: 0.617 w3: 0.680 b: 0.009 Cost: 1.122429
Epoch 1000/1000 w1: 0.718 w2: 0.613 w3: 0.680 b: 0.009 Cost: 1.079378


In [11]:
# 행렬 연산을 고려하여 파이토치로 구현
x_train  =  torch.FloatTensor([[73,  80,  75], 
                               [93,  88,  93], 
                               [89,  91,  80], 
                               [96,  98,  100],   
                               [73,  66,  70]])  
y_train  =  torch.FloatTensor([[152],  [185],  [180],  [196],  [142]])

print(x_train.shape)
print(y_train.shape)

# 행렬의 곱셈이 성립되려면 
# 곱셈의 좌측에 있는 행렬의 열의 크기와 우측에 있는 행렬의 행의 크기가 일치해야 한다
# x_train = (5x3) w = (3x1)

W = torch.zeros((3, 1), requires_grad=True)
print(W)
b = torch.zeros(1, requires_grad=True)

nb_epochs = 20
for epoch in range(nb_epochs + 1):

    # H(x) 계산
    # 편향 b는 브로드 캐스팅되어 각 샘플에 더해집니다.
    # 샘플 : 전체 훈련 데이터의 개수를 셀 수 있는 1개의 단위
    hypothesis = x_train.matmul(W) + b

    # cost 계산
    cost = torch.mean((hypothesis - y_train) ** 2)

    # cost로 H(x) 개선
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    print('Epoch {:4d}/{} hypothesis: {} Cost: {:.6f}'.format(
        epoch, nb_epochs, hypothesis.squeeze(), cost.item()
    ))

    # squeeze() 적용 안하면 아래와 같이 출력
    '''
    Epoch   20/20 hypothesis: tensor([[0.],
        [0.],
        [0.],
        [0.],
        [0.]], grad_fn=<AddBackward0>) Cost: 29661.800781
    '''

torch.Size([5, 3])
torch.Size([5, 1])
tensor([[0.],
        [0.],
        [0.]], requires_grad=True)
Epoch    0/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    1/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    2/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    3/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    4/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    5/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    6/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    7/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) Cost: 29661.800781
Epoch    8/20 hypothesis: tensor([0., 0., 0., 0., 0.], grad_fn=<SqueezeBackward0>) 