In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
import os, random
import numpy as np

from torchvision import transforms, datasets

USE_CUDA = torch.cuda.is_available()
DEVICE = torch.device("cuda" if USE_CUDA else "cpu")
"""
[주의!]
이전 코드는 수정하지 마세요
"""
###################################################################

class MyModel(nn.Module):
    def __init__(self, input_size, hidden_size, num_layers, num_classes):
        super().__init__()
        self.hidden_size = hidden_size
        self.num_layers = num_layers
        self.lstm = nn.LSTM(input_size, hidden_size, num_layers, batch_first=True)
        self.fc = nn.Linear(hidden_size, num_classes)
    
    def forward(self, x):
        # Set initial hidden and cell states 
        h0 = torch.zeros(self.num_layers, x.size(0), self.hidden_size).to(DEVICE) 
        c0 = torch.zeros(self.num_layers, x.size(0), self.hidden_size).to(DEVICE)
        
        # Forward propagate LSTM
        out, _ = self.lstm(x, (h0, c0))  # out: tensor of shape (batch_size, seq_length, hidden_size)
        
        # Decode the hidden state of the last time step
        out = self.fc(out[:, -1, :])
        return out

sequence_length = 28
input_size = 28
hidden_size = 128
num_layers = 2
num_classes = 10
batch_size = 100
num_epochs = 2
learning_rate = 0.01
model = MyModel(input_size, hidden_size, num_layers, num_classes).to(DEVICE)



"""
[주의!]
이후 코드는 수정하지 마세요
"""




SEED = 123
os.environ['PYTHONHASHSEED'] = str(SEED)
random.seed(SEED)
torch.manual_seed(SEED)
np.random.seed(SEED)


if DEVICE.type == "cuda":
    torch.cuda.manual_seed(SEED)
    torch.cuda.manual_seed_all(SEED)
    torch.backends.cudnn.enabled = False
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True
 
#model = MyModel().to(DEVICE)
optimizer = optim.SGD(model.parameters(), lr=0.01)
transform = transforms.Compose([
    transforms.ToTensor()
])

trainset = datasets.MNIST(
    root='../.data/',
    train=True,
    download=True,
    transform=transform
)
testset = datasets.MNIST(
    root='../.data/',
    train=False,
    download=True,
    transform=transform
)

BATCH_SIZE = 64

train_loader = torch.utils.data.DataLoader(
    dataset=trainset,
    batch_size=BATCH_SIZE,
    shuffle=True,
)
test_loader = torch.utils.data.DataLoader(
    dataset=testset,
    batch_size=BATCH_SIZE,
    shuffle=True,
)



def train(model, train_loader, optimizer):
    model.train()
    for batch_idx, (data, target) in enumerate(train_loader):

        data, target = data.to(DEVICE), target.to(DEVICE)
        optimizer.zero_grad()
        output = model(data)
        loss = F.cross_entropy(output, target)
        loss.backward()
        optimizer.step()

def evaluate(model, test_loader):
    model.eval()
    test_loss = 0
    correct = 0
    with torch.no_grad():
        for data, target in test_loader:
            data, target = data.to(DEVICE), target.to(DEVICE)
            output = model(data)

            test_loss += F.cross_entropy(output, target,
                                         reduction='sum').item()

            pred = output.max(1, keepdim=True)[1]
            correct += pred.eq(target.view_as(pred)).sum().item()

    test_loss /= len(test_loader.dataset)
    test_accuracy = 100. * correct / len(test_loader.dataset)
    return test_loss, test_accuracy

EPOCHS = 2

for epoch in range(1, EPOCHS + 1):
    train(model, train_loader, optimizer)
    test_loss, test_accuracy = evaluate(model, test_loader)

    print('[{}] Test Loss: {:.4f}, Accuracy: {:.2f}%'.format(
        epoch, test_loss, test_accuracy))




Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz to ../.data/MNIST/raw/train-images-idx3-ubyte.gz


100.1%

Extracting ../.data/MNIST/raw/train-images-idx3-ubyte.gz to ../.data/MNIST/raw
Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz to ../.data/MNIST/raw/train-labels-idx1-ubyte.gz


113.5%

Extracting ../.data/MNIST/raw/train-labels-idx1-ubyte.gz to ../.data/MNIST/raw
Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz to ../.data/MNIST/raw/t10k-images-idx3-ubyte.gz


100.4%

Extracting ../.data/MNIST/raw/t10k-images-idx3-ubyte.gz to ../.data/MNIST/raw
Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz to ../.data/MNIST/raw/t10k-labels-idx1-ubyte.gz


180.4%

Extracting ../.data/MNIST/raw/t10k-labels-idx1-ubyte.gz to ../.data/MNIST/raw
Processing...
Done!
> <ipython-input-1-e734efde91ee>(30)forward()
-> h0 = torch.zeros(self.num_layers, x.size(0), self.hidden_size).to(DEVICE)
(Pdb) c


RuntimeError: input must have 3 dimensions, got 4