In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms

In [2]:
# 학습 데아터 로딩
train_loader = torch.utils.data.DataLoader(
    datasets.MNIST('./data2', train=True, download=True,
                  transform=transforms.Compose([
                      transforms.ToTensor(),
                      transforms.Normalize((0.1307,), (0.3081,))
                  ])),
    batch_size=64, shuffle=True)

test_loader = torch.utils.data.DataLoader(
    datasets.MNIST('./data2', train=False, download=True,
    transform=transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.1307,), (0.3081,))
    ])),
    batch_size=1000, shuffle=True)

Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz to ./data2\MNIST\raw\train-images-idx3-ubyte.gz


100%|██████████████████████████████████████████████████████████████████| 9912422/9912422 [00:00<00:00, 30158359.50it/s]


Extracting ./data2\MNIST\raw\train-images-idx3-ubyte.gz to ./data2\MNIST\raw

Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz to ./data2\MNIST\raw\train-labels-idx1-ubyte.gz


100%|██████████████████████████████████████████████████████████████████████| 28881/28881 [00:00<00:00, 28766491.05it/s]


Extracting ./data2\MNIST\raw\train-labels-idx1-ubyte.gz to ./data2\MNIST\raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz to ./data2\MNIST\raw\t10k-images-idx3-ubyte.gz


100%|██████████████████████████████████████████████████████████████████| 1648877/1648877 [00:00<00:00, 12235253.50it/s]


Extracting ./data2\MNIST\raw\t10k-images-idx3-ubyte.gz to ./data2\MNIST\raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz to ./data2\MNIST\raw\t10k-labels-idx1-ubyte.gz


100%|█████████████████████████████████████████████████████████████████████████| 4542/4542 [00:00<00:00, 4607141.18it/s]

Extracting ./data2\MNIST\raw\t10k-labels-idx1-ubyte.gz to ./data2\MNIST\raw






In [3]:
# 모델 정의
class MLP(nn.Module):
    def __init__(self):
        super(MLP, self).__init__()
        self.fc1 = nn.Linear(784, 256)
        self.fc2 = nn.Linear(256, 128)
        self.fc3 = nn.Linear(128, 10)
        
    def forward(self, x):
        x = x.view(-1, 784)
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = self.fc3(x)
        return x

model = MLP()

# 손실함수 및 최적화 알고리즘 정의
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(model.parameters(), lr=0.01)

In [4]:
# 학습 실행
for epoch in range(10):
    running_loss = 0.0
    for i, (inputs, labels) in enumerate(train_loader, 0):
        optimizer.zero_grad()
        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        
        running_loss += loss.item()
        if i % 100 == 99:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, i+1, running_loss / 100))
            running_loss = 0.0

[1,   100] loss: 2.151
[1,   200] loss: 1.537
[1,   300] loss: 0.889
[1,   400] loss: 0.622
[1,   500] loss: 0.500
[1,   600] loss: 0.452
[1,   700] loss: 0.416
[1,   800] loss: 0.378
[1,   900] loss: 0.358
[2,   100] loss: 0.345
[2,   200] loss: 0.323
[2,   300] loss: 0.323
[2,   400] loss: 0.313
[2,   500] loss: 0.302
[2,   600] loss: 0.300
[2,   700] loss: 0.283
[2,   800] loss: 0.271
[2,   900] loss: 0.281
[3,   100] loss: 0.268
[3,   200] loss: 0.266
[3,   300] loss: 0.267
[3,   400] loss: 0.241
[3,   500] loss: 0.253
[3,   600] loss: 0.250
[3,   700] loss: 0.226
[3,   800] loss: 0.246
[3,   900] loss: 0.237
[4,   100] loss: 0.237
[4,   200] loss: 0.221
[4,   300] loss: 0.228
[4,   400] loss: 0.209
[4,   500] loss: 0.210
[4,   600] loss: 0.206
[4,   700] loss: 0.214
[4,   800] loss: 0.206
[4,   900] loss: 0.198
[5,   100] loss: 0.185
[5,   200] loss: 0.191
[5,   300] loss: 0.185
[5,   400] loss: 0.189
[5,   500] loss: 0.188
[5,   600] loss: 0.185
[5,   700] loss: 0.181
[5,   800] 

In [5]:
correct = 0
total = 0
with torch.no_grad():
    for inputs, labels in test_loader:
        outputs = model(inputs)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
        
    print('Accuracy of the network on the 10000 test images: %d %%' % (100 * correct / total))

Accuracy of the network on the 10000 test images: 96 %
