<a href="https://colab.research.google.com/github/jaejinnn/pytorch/blob/main/240113.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

## 03-05 클래스로 파이토치 모델 구현하기

### 1. 모델을 클래스로 구현하기

In [2]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [3]:
# Declare and initialise the model. Simple linear regression maps one input
# feature to one output value.
model = nn.Linear(in_features=1, out_features=1)

In [4]:
class LinearRegressionModel(nn.Module):
    """Linear regression expressed as an ``nn.Module`` subclass.

    The model wraps a single ``nn.Linear`` layer. With the default arguments
    it is the simple (one input, one output) regression used in this notebook.

    Args:
        input_dim: Number of input features per sample. Defaults to 1.
        output_dim: Number of values predicted per sample. Defaults to 1.
    """

    def __init__(self, input_dim: int = 1, output_dim: int = 1):
        super().__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the linear layer's prediction for ``x``."""
        return self.linear(x)

In [5]:
# Instantiate the class-based simple linear regression model.
model = LinearRegressionModel()

In [9]:
# Declare and initialise the model. Multivariate linear regression maps three
# input features to one output value.
model = nn.Linear(in_features=3, out_features=1)

In [10]:
class MultivariateLinearRegressionModel(nn.Module):
    """Multivariate linear regression expressed as an ``nn.Module`` subclass.

    The model wraps a single ``nn.Linear`` layer. With the default arguments
    it maps three input features to one output value, as used in this notebook.

    Args:
        input_dim: Number of input features per sample. Defaults to 3.
        output_dim: Number of values predicted per sample. Defaults to 1.
    """

    def __init__(self, input_dim: int = 3, output_dim: int = 1):
        super().__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the linear layer's prediction for ``x``."""
        return self.linear(x)

In [12]:
# Instantiate the class-based multivariate linear regression model.
model = MultivariateLinearRegressionModel()

### 2. 단순 선형 회귀 클래스로 구현하기

In [13]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [15]:
# Seed PyTorch's random number generator so the run is repeatable.
torch.manual_seed(seed=1)

<torch._C.Generator at 0x7aee22721450>

In [16]:
# Training data: three samples, one feature and one target each
x_train = torch.tensor([[1], [2], [3]], dtype=torch.float32)
y_train = torch.tensor([[2], [4], [6]], dtype=torch.float32)

In [17]:
class LinearRegressionModel(nn.Module):
    """Linear regression expressed as an ``nn.Module`` subclass.

    The model wraps a single ``nn.Linear`` layer. With the default arguments
    it is the simple (one input, one output) regression trained in this section.

    Args:
        input_dim: Number of input features per sample. Defaults to 1.
        output_dim: Number of values predicted per sample. Defaults to 1.
    """

    def __init__(self, input_dim: int = 1, output_dim: int = 1):
        super().__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the linear layer's prediction for ``x``."""
        return self.linear(x)

In [19]:
# Create the model instance that the training loop below will fit.
model = LinearRegressionModel()

In [20]:
# Optimizer: stochastic gradient descent over the model's parameters with a
# learning rate (lr) of 0.01.
optimizer = torch.optim.SGD(params=model.parameters(), lr=0.01)

In [21]:
# Full-batch gradient descent over the whole training set. The range below
# yields epochs 0 through nb_epochs inclusive.
nb_epochs = 2000
for epoch in range(nb_epochs + 1):
    # Forward pass: compute H(x)
    prediction = model(x_train)

    # Cost: PyTorch's built-in mean squared error
    cost = F.mse_loss(prediction, y_train)

    # Improve H(x) using the cost: reset the gradients to zero,
    # differentiate the cost (backward pass), then update W and b.
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    # Log only every 100th epoch
    if epoch % 100 != 0:
        continue
    print('Epoch {:4d}/{} Cost: {:.6f}'.format(epoch, nb_epochs, cost.item()))

Epoch    0/2000 Cost: 18.562185
Epoch  100/2000 Cost: 0.128051
Epoch  200/2000 Cost: 0.079128
Epoch  300/2000 Cost: 0.048896
Epoch  400/2000 Cost: 0.030215
Epoch  500/2000 Cost: 0.018671
Epoch  600/2000 Cost: 0.011538
Epoch  700/2000 Cost: 0.007129
Epoch  800/2000 Cost: 0.004406
Epoch  900/2000 Cost: 0.002722
Epoch 1000/2000 Cost: 0.001682
Epoch 1100/2000 Cost: 0.001040
Epoch 1200/2000 Cost: 0.000642
Epoch 1300/2000 Cost: 0.000397
Epoch 1400/2000 Cost: 0.000245
Epoch 1500/2000 Cost: 0.000152
Epoch 1600/2000 Cost: 0.000094
Epoch 1700/2000 Cost: 0.000058
Epoch 1800/2000 Cost: 0.000036
Epoch 1900/2000 Cost: 0.000022
Epoch 2000/2000 Cost: 0.000014


### 3. 다중 선형 회귀 클래스로 구현하기

In [22]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [24]:
# Seed PyTorch's random number generator so the run is repeatable.
torch.manual_seed(seed=1)

<torch._C.Generator at 0x7aee22721450>

In [25]:
# Training data: five samples with three features each, one target per sample
x_train = torch.tensor(
    [
        [73, 80, 75],
        [93, 88, 93],
        [89, 91, 90],
        [96, 98, 100],
        [73, 66, 70],
    ],
    dtype=torch.float32,
)
y_train = torch.tensor([[152], [185], [180], [196], [142]], dtype=torch.float32)

In [26]:
class MultivariateLinearRegressionModel(nn.Module):
    """Multivariate linear regression expressed as an ``nn.Module`` subclass.

    The model wraps a single ``nn.Linear`` layer. With the default arguments
    it maps three input features to one output value, matching the training
    data of this section.

    Args:
        input_dim: Number of input features per sample. Defaults to 3.
        output_dim: Number of values predicted per sample. Defaults to 1.
    """

    def __init__(self, input_dim: int = 3, output_dim: int = 1):
        super().__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the linear layer's prediction for ``x``."""
        return self.linear(x)

In [28]:
# Create the model instance that the training loop below will fit.
model = MultivariateLinearRegressionModel()

In [29]:
# Optimizer: stochastic gradient descent over the model's parameters with a
# learning rate (lr) of 1e-5.
optimizer = torch.optim.SGD(params=model.parameters(), lr=1e-5)

In [30]:
# Full-batch gradient descent; the range below yields epochs 0 through
# nb_epochs inclusive.
nb_epochs = 2000
for epoch in range(nb_epochs + 1):
    # Forward pass: compute H(x).
    # Calling model(x_train) is the same as calling model.forward(x_train).
    prediction = model(x_train)

    # Cost: PyTorch's built-in mean squared error
    cost = F.mse_loss(prediction, y_train)

    # Improve H(x) using the cost: reset the gradients to zero,
    # differentiate the cost, then update W and b.
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    # Skip the log line unless this is a 100th epoch
    if epoch % 100:
        continue
    print('Epoch {:4d}/{} Cost: {:.6f}'.format(epoch, nb_epochs, cost.item()))

Epoch    0/2000 Cost: 39633.414062
Epoch  100/2000 Cost: 11.480746
Epoch  200/2000 Cost: 10.894592
Epoch  300/2000 Cost: 10.339335
Epoch  400/2000 Cost: 9.813341
Epoch  500/2000 Cost: 9.314991
Epoch  600/2000 Cost: 8.842943
Epoch  700/2000 Cost: 8.395709
Epoch  800/2000 Cost: 7.972019
Epoch  900/2000 Cost: 7.570613
Epoch 1000/2000 Cost: 7.190366
Epoch 1100/2000 Cost: 6.830102
Epoch 1200/2000 Cost: 6.488800
Epoch 1300/2000 Cost: 6.165435
Epoch 1400/2000 Cost: 5.859081
Epoch 1500/2000 Cost: 5.568858
Epoch 1600/2000 Cost: 5.293914
Epoch 1700/2000 Cost: 5.033381
Epoch 1800/2000 Cost: 4.786536
Epoch 1900/2000 Cost: 4.552677
Epoch 2000/2000 Cost: 4.331120


## 03-06 미니 배치와 데이터 로드(Mini Batch and Data Load)

### 1. 미니 배치와 배치 크기(Mini Batch and Batch Size)

In [31]:
# Five samples with three features each, and one target value per sample
x_train = torch.tensor(
    [
        [73, 80, 75],
        [93, 88, 93],
        [89, 91, 90],
        [96, 98, 100],
        [73, 66, 70],
    ],
    dtype=torch.float32,
)
y_train = torch.tensor([[152], [185], [180], [196], [142]], dtype=torch.float32)

### 2. 이터레이션(Iteration)

### 3. 데이터 로드하기(Data Load)

In [32]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [33]:
from torch.utils.data import TensorDataset # 텐서데이터셋
from torch.utils.data import DataLoader # 데이터로더

In [56]:
# Full training set: five samples with three features each, one target each
x_train = torch.tensor(
    [
        [73, 80, 75],
        [93, 88, 93],
        [89, 91, 90],
        [96, 98, 100],
        [73, 66, 70],
    ],
    dtype=torch.float32,
)
y_train = torch.tensor([[152], [185], [180], [196], [142]], dtype=torch.float32)

In [57]:
# Wrap the feature and target tensors in a single TensorDataset.
dataset = TensorDataset(x_train, y_train)

In [58]:
# Serve the dataset in mini-batches of two samples, with shuffling enabled.
dataloader = DataLoader(dataset, batch_size=2, shuffle=True)

In [59]:
# Three input features, one output value; trained with SGD at lr = 1e-5.
model = nn.Linear(in_features=3, out_features=1)
optimizer = torch.optim.SGD(params=model.parameters(), lr=1e-5)

In [60]:
# Mini-batch gradient descent: every epoch iterates over all batches produced
# by the DataLoader and performs one parameter update per batch. The range
# below yields epochs 0 through nb_epochs inclusive.
nb_epochs = 20
for epoch in range(nb_epochs + 1):
    for batch_idx, samples in enumerate(dataloader):
        # Unpack into batch-local names. Assigning to x_train / y_train here
        # would overwrite the notebook-level training tensors with the last
        # mini-batch, so re-running the cell that builds the dataset would
        # silently produce a truncated dataset.
        x_batch, y_batch = samples

        # Forward pass: compute H(x) for this batch
        prediction = model(x_batch)

        # Cost: mean squared error on this batch
        cost = F.mse_loss(prediction, y_batch)

        # Improve H(x) using the cost: reset the gradients, backpropagate,
        # then update the parameters.
        optimizer.zero_grad()
        cost.backward()
        optimizer.step()

        print('Epoch {:4d}/{} Batch {}/{} Cost: {:.6f}'.format(
            epoch, nb_epochs, batch_idx+1, len(dataloader),
            cost.item()
            ))

Epoch    0/20 Batch 1/3 Cost: 8343.354492
Epoch    0/20 Batch 2/3 Cost: 1426.161499
Epoch    0/20 Batch 3/3 Cost: 1112.988403
Epoch    1/20 Batch 1/3 Cost: 200.030579
Epoch    1/20 Batch 2/3 Cost: 30.962631
Epoch    1/20 Batch 3/3 Cost: 11.880800
Epoch    2/20 Batch 1/3 Cost: 5.754392
Epoch    2/20 Batch 2/3 Cost: 2.274139
Epoch    2/20 Batch 3/3 Cost: 0.024620
Epoch    3/20 Batch 1/3 Cost: 0.549288
Epoch    3/20 Batch 2/3 Cost: 0.362169
Epoch    3/20 Batch 3/3 Cost: 0.397599
Epoch    4/20 Batch 1/3 Cost: 0.306390
Epoch    4/20 Batch 2/3 Cost: 0.307105
Epoch    4/20 Batch 3/3 Cost: 0.234279
Epoch    5/20 Batch 1/3 Cost: 0.392011
Epoch    5/20 Batch 2/3 Cost: 0.270754
Epoch    5/20 Batch 3/3 Cost: 0.202044
Epoch    6/20 Batch 1/3 Cost: 0.319352
Epoch    6/20 Batch 2/3 Cost: 0.232862
Epoch    6/20 Batch 3/3 Cost: 0.741623
Epoch    7/20 Batch 1/3 Cost: 0.449567
Epoch    7/20 Batch 2/3 Cost: 0.289404
Epoch    7/20 Batch 3/3 Cost: 0.388739
Epoch    8/20 Batch 1/3 Cost: 0.077758
Epoch    8/2

In [68]:
# Declare an arbitrary input [73, 80, 75]
new_var = torch.tensor([[73, 80, 75]], dtype=torch.float32)
# Feed it through the model and keep the predicted y in pred_y
pred_y = model(new_var)
print("훈련 후 입력이 73, 80, 75일 때의 예측값 :", pred_y)

훈련 후 입력이 73, 80, 75일 때의 예측값 : tensor([[151.7467]], grad_fn=<AddmmBackward0>)


## 03-07 커스텀 데이터셋(Custom Dataset)

### 1. 커스텀 데이터셋(Custom Dataset)

In [None]:
class CustomDataset(torch.utils.data.Dataset):
  """Skeleton of a custom dataset: the three methods a subclass fills in.

  Each method needs a body for the cell to be valid Python; the two accessors
  raise NotImplementedError until a real implementation is provided.
  """

  def __init__(self):
    # Load and preprocess the data here.
    pass

  def __len__(self):
    # Return the total number of samples in the dataset.
    raise NotImplementedError

  def __getitem__(self, idx):
    # Return the sample stored at position idx.
    raise NotImplementedError

In [70]:
import torch
import torch.nn.functional as F
from torch.utils.data import Dataset
from torch.utils.data import DataLoader

In [71]:
# Subclass of Dataset
class CustomDataset(Dataset):
    """Dataset of five samples: three features and one target value each."""

    def __init__(self):
        # Targets and features are kept as plain nested lists.
        self.y_data = [[152], [185], [180], [196], [142]]
        self.x_data = [
            [73, 80, 75],
            [93, 88, 93],
            [89, 91, 90],
            [96, 98, 100],
            [73, 66, 70],
        ]

    def __len__(self):
        """Return the total number of samples."""
        return len(self.x_data)

    def __getitem__(self, idx):
        """Return the input/target pair at ``idx`` as PyTorch float tensors."""
        features = torch.FloatTensor(self.x_data[idx])
        target = torch.FloatTensor(self.y_data[idx])
        return features, target

In [76]:
# Build the custom dataset and serve it in mini-batches of two samples, with
# shuffling enabled.
dataset = CustomDataset()
dataloader = DataLoader(dataset, batch_size=2, shuffle=True)

In [77]:
# Three input features, one output value; trained with SGD at lr = 1e-5.
model = torch.nn.Linear(in_features=3, out_features=1)
optimizer = torch.optim.SGD(params=model.parameters(), lr=1e-5)

In [79]:
# Mini-batch gradient descent over the custom dataset: one parameter update
# per batch. The range below yields epochs 0 through nb_epochs inclusive.
nb_epochs = 20
for epoch in range(nb_epochs + 1):
    for batch_idx, samples in enumerate(dataloader):
        # Unpack into batch-local names. Assigning to x_train / y_train here
        # would overwrite the notebook-level training tensors with the last
        # mini-batch and leave stale state behind for any cell that is re-run.
        x_batch, y_batch = samples

        # Forward pass: compute H(x) for this batch
        prediction = model(x_batch)

        # Cost: mean squared error on this batch
        cost = F.mse_loss(prediction, y_batch)

        # Improve H(x) using the cost: reset the gradients, backpropagate,
        # then update the parameters.
        optimizer.zero_grad()
        cost.backward()
        optimizer.step()

        print('Epoch {:4d}/{} Batch {}/{} Cost: {:.6f}'.format(
            epoch, nb_epochs, batch_idx+1, len(dataloader),
            cost.item()
            ))

Epoch    0/20 Batch 1/3 Cost: 26223.976562
Epoch    0/20 Batch 2/3 Cost: 11275.369141
Epoch    0/20 Batch 3/3 Cost: 4022.767822
Epoch    1/20 Batch 1/3 Cost: 973.816162
Epoch    1/20 Batch 2/3 Cost: 143.515045
Epoch    1/20 Batch 3/3 Cost: 17.435619
Epoch    2/20 Batch 1/3 Cost: 43.817715
Epoch    2/20 Batch 2/3 Cost: 1.350063
Epoch    2/20 Batch 3/3 Cost: 26.018312
Epoch    3/20 Batch 1/3 Cost: 3.357798
Epoch    3/20 Batch 2/3 Cost: 5.251723
Epoch    3/20 Batch 3/3 Cost: 9.332607
Epoch    4/20 Batch 1/3 Cost: 2.698937
Epoch    4/20 Batch 2/3 Cost: 5.873086
Epoch    4/20 Batch 3/3 Cost: 6.788309
Epoch    5/20 Batch 1/3 Cost: 6.273944
Epoch    5/20 Batch 2/3 Cost: 4.461147
Epoch    5/20 Batch 3/3 Cost: 5.619047
Epoch    6/20 Batch 1/3 Cost: 7.004045
Epoch    6/20 Batch 2/3 Cost: 2.389186
Epoch    6/20 Batch 3/3 Cost: 5.168796
Epoch    7/20 Batch 1/3 Cost: 2.243939
Epoch    7/20 Batch 2/3 Cost: 10.275814
Epoch    7/20 Batch 3/3 Cost: 4.214094
Epoch    8/20 Batch 1/3 Cost: 2.555760
Epoch 

In [80]:
# Declare an arbitrary input [73, 80, 75]
new_var = torch.tensor([[73, 80, 75]], dtype=torch.float32)
# Feed it through the model and keep the predicted y in pred_y
pred_y = model(new_var)
print("훈련 후 입력이 73, 80, 75일 때의 예측값 :", pred_y)

훈련 후 입력이 73, 80, 75일 때의 예측값 : tensor([[153.8296]], grad_fn=<AddmmBackward0>)
