## 3.4 미니배치와 데이터로드

In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [2]:
from torch.utils.data import TensorDataset # 텐서데이터셋
from torch.utils.data import DataLoader # 데이터로더

In [3]:
# Training data: five samples with three input features each, paired with
# one regression target per sample.  torch.tensor with an explicit dtype is
# used instead of the legacy torch.FloatTensor constructor; the resulting
# tensors hold the same float32 values.
x_train = torch.tensor([[73, 80, 75],
                        [93, 88, 93],
                        [89, 91, 90],
                        [96, 98, 100],
                        [73, 66, 70]], dtype=torch.float32)
y_train = torch.tensor([[152], [185], [180], [196], [142]],
                       dtype=torch.float32)

In [4]:
# Pair the input tensor with the target tensor in a single dataset object
# that the DataLoader below can draw mini-batches from.
dataset = TensorDataset(x_train, y_train)

In [5]:
# Serve the dataset in mini-batches of two samples, reshuffled every epoch.
dataloader = DataLoader(dataset=dataset, shuffle=True, batch_size=2)

In [6]:
# Linear regression model: three input features mapped to one output value.
model = nn.Linear(in_features=3, out_features=1)
# Plain stochastic gradient descent over the model's parameters.
optimizer = torch.optim.SGD(params=model.parameters(), lr=1e-5)

In [7]:
# Mini-batch training loop.  Note that range(nb_epochs + 1) performs
# nb_epochs + 1 passes over the data, logged as epochs 0..nb_epochs.
nb_epochs = 20
for epoch in range(nb_epochs + 1):
  # Each item from the DataLoader is one (inputs, targets) mini-batch.  The
  # batch tensors get their own names so the full x_train / y_train tensors
  # defined earlier in the notebook are not overwritten by the last batch.
  for batch_idx, (x_batch, y_batch) in enumerate(dataloader):
    # Forward pass: compute the hypothesis H(x) for this mini-batch.
    prediction = model(x_batch)

    # Cost: mean squared error between the predictions and the targets.
    cost = F.mse_loss(prediction, y_batch)

    # Improve H(x) using the cost: clear stale gradients, backpropagate,
    # then let the optimizer update the model parameters.
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    print('Epoch {:4d}/{} Batch {}/{} Cost: {:.6f}'.format(
        epoch, nb_epochs, batch_idx+1, len(dataloader),
        cost.item()
        ))

Epoch    0/20 Batch 1/3 Cost: 23257.527344
Epoch    0/20 Batch 2/3 Cost: 17672.039062
Epoch    0/20 Batch 3/3 Cost: 3385.473633
Epoch    1/20 Batch 1/3 Cost: 864.252502
Epoch    1/20 Batch 2/3 Cost: 251.374481
Epoch    1/20 Batch 3/3 Cost: 86.673782
Epoch    2/20 Batch 1/3 Cost: 35.489113
Epoch    2/20 Batch 2/3 Cost: 13.626832
Epoch    2/20 Batch 3/3 Cost: 0.394986
Epoch    3/20 Batch 1/3 Cost: 12.455564
Epoch    3/20 Batch 2/3 Cost: 0.078475
Epoch    3/20 Batch 3/3 Cost: 3.066026
Epoch    4/20 Batch 1/3 Cost: 3.280087
Epoch    4/20 Batch 2/3 Cost: 4.944057
Epoch    4/20 Batch 3/3 Cost: 4.782553
Epoch    5/20 Batch 1/3 Cost: 2.771343
Epoch    5/20 Batch 2/3 Cost: 6.105266
Epoch    5/20 Batch 3/3 Cost: 0.111668
Epoch    6/20 Batch 1/3 Cost: 1.355516
Epoch    6/20 Batch 2/3 Cost: 7.863143
Epoch    6/20 Batch 3/3 Cost: 0.797077
Epoch    7/20 Batch 1/3 Cost: 0.954928
Epoch    7/20 Batch 2/3 Cost: 2.446537
Epoch    7/20 Batch 3/3 Cost: 10.253852
Epoch    8/20 Batch 1/3 Cost: 0.887550
... (output truncated)

In [8]:
# Declare an arbitrary input sample [73, 80, 75] as a single-row batch.
# torch.tensor with an explicit dtype replaces the legacy torch.FloatTensor
# constructor; the values and dtype are the same.
new_var = torch.tensor([[73, 80, 75]], dtype=torch.float32)
# Run the trained model on that input and keep the predicted y in pred_y.
pred_y = model(new_var)
print("훈련 후 입력이 73, 80, 75일 때의 예측값 :", pred_y)

훈련 후 입력이 73, 80, 75일 때의 예측값 : tensor([[152.5234]], grad_fn=<AddmmBackward0>)


## 4.7 커스텀 데이터셋

In [9]:
import torch
import torch.nn.functional as F

In [10]:
from torch.utils.data import Dataset
from torch.utils.data import DataLoader

In [11]:
# Subclass torch.utils.data.Dataset so a DataLoader can index the samples.
class CustomDataset(Dataset):
  """Map-style dataset of (features, target) pairs kept as nested sequences.

  Args:
    x_data: Optional sequence of feature rows.  When both arguments are
      omitted, the built-in five-sample example data is used, so
      ``CustomDataset()`` behaves as before.
    y_data: Optional sequence of target rows, one per row of ``x_data``.

  Raises:
    ValueError: If only one of ``x_data`` / ``y_data`` is given, or if the
      two sequences have different lengths.
  """

  def __init__(self, x_data=None, y_data=None):
    if x_data is None and y_data is None:
      # Default example data: three features and one target per sample.
      x_data = [[73, 80, 75],
                [93, 88, 93],
                [89, 91, 90],
                [96, 98, 100],
                [73, 66, 70]]
      y_data = [[152], [185], [180], [196], [142]]
    elif x_data is None or y_data is None:
      raise ValueError("x_data and y_data must be provided together")

    # Every input row needs a matching target row; otherwise indexing would
    # fail (or silently skip data) partway through an epoch.
    if len(x_data) != len(y_data):
      raise ValueError(
          "x_data and y_data must have the same length, got {} and {}".format(
              len(x_data), len(y_data)))

    self.x_data = x_data
    self.y_data = y_data

  def __len__(self):
    """Return the total number of samples."""
    return len(self.x_data)

  def __getitem__(self, idx):
    """Return the sample at ``idx`` as a pair of float32 tensors (x, y)."""
    # torch.tensor with an explicit dtype replaces the legacy
    # torch.FloatTensor constructor and yields the same float32 values.
    x = torch.tensor(self.x_data[idx], dtype=torch.float32)
    y = torch.tensor(self.y_data[idx], dtype=torch.float32)
    return x, y


In [12]:
# Instantiate the custom dataset and serve it in shuffled mini-batches of
# two samples.
dataset = CustomDataset()
dataloader = DataLoader(dataset=dataset, shuffle=True, batch_size=2)

In [13]:
# Linear regression model: three input features mapped to one output value.
model = torch.nn.Linear(in_features=3, out_features=1)
# Plain stochastic gradient descent over the model's parameters.
optimizer = torch.optim.SGD(params=model.parameters(), lr=1e-5)

In [14]:
# Mini-batch training loop.  Note that range(nb_epochs + 1) performs
# nb_epochs + 1 passes over the data, logged as epochs 0..nb_epochs.
nb_epochs = 20
for epoch in range(nb_epochs + 1):
  # Each item from the DataLoader is one (inputs, targets) mini-batch.  The
  # batch tensors are named x_batch / y_batch so that they do not rebind any
  # notebook-level x_train / y_train holding a full training set.
  for batch_idx, (x_batch, y_batch) in enumerate(dataloader):
    # Forward pass: compute the hypothesis H(x) for this mini-batch.
    prediction = model(x_batch)

    # Cost: mean squared error between the predictions and the targets.
    cost = F.mse_loss(prediction, y_batch)

    # Improve H(x) using the cost: clear stale gradients, backpropagate,
    # then let the optimizer update the model parameters.
    optimizer.zero_grad()
    cost.backward()
    optimizer.step()

    print('Epoch {:4d}/{} Batch {}/{} Cost: {:.6f}'.format(
        epoch, nb_epochs, batch_idx+1, len(dataloader),
        cost.item()
        ))

Epoch    0/20 Batch 1/3 Cost: 75020.125000
Epoch    0/20 Batch 2/3 Cost: 24831.166016
Epoch    0/20 Batch 3/3 Cost: 12616.029297
Epoch    1/20 Batch 1/3 Cost: 1722.126465
Epoch    1/20 Batch 2/3 Cost: 631.052612
Epoch    1/20 Batch 3/3 Cost: 192.532135
Epoch    2/20 Batch 1/3 Cost: 67.422203
Epoch    2/20 Batch 2/3 Cost: 8.603775
Epoch    2/20 Batch 3/3 Cost: 10.887603
Epoch    3/20 Batch 1/3 Cost: 2.154814
Epoch    3/20 Batch 2/3 Cost: 1.840367
Epoch    3/20 Batch 3/3 Cost: 0.000073
Epoch    4/20 Batch 1/3 Cost: 0.698225
Epoch    4/20 Batch 2/3 Cost: 0.936083
Epoch    4/20 Batch 3/3 Cost: 3.266708
Epoch    5/20 Batch 1/3 Cost: 1.726784
Epoch    5/20 Batch 2/3 Cost: 0.370153
Epoch    5/20 Batch 3/3 Cost: 0.952244
Epoch    6/20 Batch 1/3 Cost: 1.330517
Epoch    6/20 Batch 2/3 Cost: 1.051045
Epoch    6/20 Batch 3/3 Cost: 0.488075
Epoch    7/20 Batch 1/3 Cost: 2.348737
Epoch    7/20 Batch 2/3 Cost: 1.078578
Epoch    7/20 Batch 3/3 Cost: 0.295047
Epoch    8/20 Batch 1/3 Cost: 1.636580
... (output truncated)

In [15]:
# Declare an arbitrary input sample [73, 80, 75] as a single-row batch.
# torch.tensor with an explicit dtype replaces the legacy torch.FloatTensor
# constructor; the values and dtype are the same.
new_var = torch.tensor([[73, 80, 75]], dtype=torch.float32)
# Run the trained model on that input and keep the predicted y in pred_y.
pred_y = model(new_var)
print("훈련 후 입력이 73, 80, 75일 때의 예측값 :", pred_y)

훈련 후 입력이 73, 80, 75일 때의 예측값 : tensor([[151.7293]], grad_fn=<AddmmBackward0>)
