In [15]:
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F

from torchvision import transforms, datasets

In [16]:
# Run on the GPU when PyTorch reports a usable CUDA runtime, otherwise on the CPU.
USE_CUDA = torch.cuda.is_available()
DEVICE = torch.device('cuda') if USE_CUDA else torch.device('cpu')

In [17]:
# Training hyperparameters: number of passes over the training split and
# the number of samples per mini-batch.
EPOCHS = 40
BATCH_SIZE = 64

# Seed PyTorch's global RNG so weight initialisation, dropout masks and
# DataLoader shuffling are repeatable across "Restart & Run All".
# NOTE: GPU kernels may still introduce small run-to-run differences.
SEED = 42
torch.manual_seed(SEED);

In [18]:
# Single preprocessing pipeline shared by both splits so they can never drift apart.
# The original constants (0.1307, 0.3081) are the MNIST statistics; the values
# below are the commonly reported mean/std of the FashionMNIST training images.
fashion_mnist_transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.2860,), (0.3530,)),
])

# Training split: reshuffled every epoch.
train_loader = torch.utils.data.DataLoader(
    datasets.FashionMNIST(
        './data',
        train=True,
        download=True,
        transform=fashion_mnist_transform),
    batch_size=BATCH_SIZE,
    shuffle=True
)

# Test split: download=True makes this statement work on its own (it is a
# no-op when the files are already present), and shuffling is disabled because
# sample order does not affect the aggregated loss/accuracy.
test_loader = torch.utils.data.DataLoader(
    datasets.FashionMNIST(
        './data',
        train=False,
        download=True,
        transform=fashion_mnist_transform),
    batch_size=BATCH_SIZE,
    shuffle=False
)

In [29]:
class CNN(nn.Module):
    """Small convolutional classifier for single-channel 28x28 images.

    Layout: conv(1->10, k=5) -> max-pool(2) -> ReLU
            -> conv(10->20, k=5) -> Dropout2d -> max-pool(2) -> ReLU
            -> flatten -> fc(320->50) -> ReLU -> dropout -> fc(50->10)
            -> log-softmax.

    The 320 input features of ``fc1`` correspond to 20 channels of 4x4, which
    is what a 28x28 input produces after the two conv/pool stages.
    """

    def __init__(self):
        super().__init__()
        self.conv1 = nn.Conv2d(1, 10, kernel_size=5)
        self.conv2 = nn.Conv2d(10, 20, kernel_size=5)
        self.drop = nn.Dropout2d()
        self.fc1 = nn.Linear(320, 50)
        self.fc2 = nn.Linear(50, 10)

    def forward(self, x):
        """Return per-class log-probabilities of shape (batch, 10).

        Args:
            x: image batch of shape (batch, 1, 28, 28).

        Raises:
            RuntimeError: if the spatial size of ``x`` does not reduce to 320
                features per sample (raised by ``fc1``).
        """
        x = F.relu(F.max_pool2d(self.conv1(x), 2))
        x = F.relu(F.max_pool2d(self.drop(self.conv2(x)), 2))
        # Flatten per sample instead of view(-1, 320): the latter silently
        # changes the batch dimension when the feature map is not 320 wide,
        # whereas this makes fc1 reject the input with a shape error.
        x = x.flatten(start_dim=1)
        x = F.relu(self.fc1(x))
        # Functional dropout must be told explicitly whether we are training.
        x = F.dropout(x, training=self.training)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

In [34]:
# Instantiate the network, place it on DEVICE, then hand its parameters to
# plain SGD with momentum.
model = CNN()
model = model.to(DEVICE)
optimizer = optim.SGD(params=model.parameters(), lr=0.01, momentum=0.5)

In [35]:
def train(model, train_loader, optimizer, epoch):
    """Run one optimisation pass over ``train_loader``.

    Args:
        model: network to optimise; switched to training mode.
        train_loader: iterable of ``(data, target)`` batches that also exposes
            ``__len__`` and a ``dataset`` attribute (used for progress output).
        optimizer: optimiser bound to ``model``'s parameters.
        epoch: epoch number, used only in the progress message.

    Returns:
        None. Progress is printed every 200 batches.
    """
    model.train()

    # Send batches to wherever the model actually lives rather than to a
    # module-level constant that may disagree with the model passed in.
    first_param = next(model.parameters(), None)
    device = None if first_param is None else first_param.device

    # Loop-invariant sizes for the progress line.
    total_batches = len(train_loader)
    total_samples = len(train_loader.dataset)

    for batch_idx, (data, target) in enumerate(train_loader):
        if device is not None:
            data, target = data.to(device), target.to(device)
        optimizer.zero_grad()
        output = model(data)
        # cross_entropy applies log_softmax internally; that is also correct
        # for a model that already returns log-probabilities, because
        # log_softmax is idempotent.
        loss = F.cross_entropy(output, target)
        loss.backward()
        optimizer.step()

        if batch_idx % 200 == 0:
            print("Train Epoch: {} [{}/{} ({:.0f}%)]\t Loss: {:.6f}"
                  .format(epoch, batch_idx * len(data), total_samples,
                          100. * batch_idx / total_batches, loss.item()))

In [36]:
def evaluate(model, test_loader):
    """Compute mean loss and accuracy of ``model`` over ``test_loader``.

    Args:
        model: network to evaluate; switched to eval mode.
        test_loader: iterable of ``(data, target)`` batches exposing a
            ``dataset`` attribute whose length is the number of samples.

    Returns:
        ``(test_loss, test_accuracy)``: per-sample mean cross-entropy and
        accuracy in percent.
    """
    model.eval()
    test_loss = 0
    correct = 0

    # Send batches to wherever the model actually lives rather than to a
    # module-level constant; a parameter-free model leaves batches in place.
    first_param = next(model.parameters(), None)
    device = None if first_param is None else first_param.device

    with torch.no_grad():
        for data, target in test_loader:
            if device is not None:
                data, target = data.to(device), target.to(device)
            output = model(data)

            # Sum (not mean) per batch so the final division by the dataset
            # size is exact even when the last batch is smaller.
            test_loss += F.cross_entropy(output, target, reduction='sum').item()

            # Predicted class = index of the highest score in each row.
            pred = output.argmax(dim=1, keepdim=True)
            correct += pred.eq(target.view_as(pred)).sum().item()

    num_samples = len(test_loader.dataset)
    test_loss /= num_samples
    test_accuracy = 100. * correct / num_samples
    return test_loss, test_accuracy

In [37]:
# Alternate one training pass with one evaluation pass and report the
# held-out metrics after every epoch (epochs are numbered from 1).
epoch_report = "[{}] Test Loss: {:.4f}, Accuracy: {:.2f}%"
for epoch in range(1, EPOCHS + 1):
    train(model, train_loader, optimizer, epoch)
    test_loss, test_accuracy = evaluate(model, test_loader)
    print(epoch_report.format(epoch, test_loss, test_accuracy))

[1] Test Loss: 0.6558, Accuracy: 74.91%
[2] Test Loss: 0.5728, Accuracy: 77.73%
[3] Test Loss: 0.5197, Accuracy: 79.49%
[4] Test Loss: 0.4971, Accuracy: 81.71%
[5] Test Loss: 0.4763, Accuracy: 82.58%
[6] Test Loss: 0.4572, Accuracy: 83.28%
[7] Test Loss: 0.4436, Accuracy: 83.60%
[8] Test Loss: 0.4289, Accuracy: 84.36%
[9] Test Loss: 0.4139, Accuracy: 84.95%
[10] Test Loss: 0.4012, Accuracy: 85.36%
[11] Test Loss: 0.3930, Accuracy: 85.69%
[12] Test Loss: 0.3802, Accuracy: 85.98%
[13] Test Loss: 0.3743, Accuracy: 86.27%
[14] Test Loss: 0.3684, Accuracy: 86.78%
[15] Test Loss: 0.3628, Accuracy: 86.78%
[16] Test Loss: 0.3580, Accuracy: 86.89%
[17] Test Loss: 0.3524, Accuracy: 87.05%
[18] Test Loss: 0.3470, Accuracy: 87.35%
[19] Test Loss: 0.3464, Accuracy: 87.27%
[20] Test Loss: 0.3476, Accuracy: 86.86%
[21] Test Loss: 0.3391, Accuracy: 87.69%
[22] Test Loss: 0.3411, Accuracy: 87.42%
[23] Test Loss: 0.3408, Accuracy: 87.28%
[24] Test Loss: 0.3375, Accuracy: 87.72%
[25] Test Loss: 0.3320, A

[28] Test Loss: 0.3291, Accuracy: 87.77%
[29] Test Loss: 0.3325, Accuracy: 87.86%
[30] Test Loss: 0.3284, Accuracy: 87.80%
[31] Test Loss: 0.3240, Accuracy: 88.18%
[32] Test Loss: 0.3209, Accuracy: 88.28%
[33] Test Loss: 0.3238, Accuracy: 88.26%
[34] Test Loss: 0.3190, Accuracy: 88.49%
[35] Test Loss: 0.3199, Accuracy: 88.39%
[36] Test Loss: 0.3182, Accuracy: 88.42%
[37] Test Loss: 0.3193, Accuracy: 88.10%
[38] Test Loss: 0.3161, Accuracy: 88.17%
[39] Test Loss: 0.3183, Accuracy: 88.23%
[40] Test Loss: 0.3127, Accuracy: 88.57%
