In [1]:
import torch
import torchvision
import torchvision.transforms as transforms
from torch import nn, optim

# Preprocessing applied to every MNIST image: convert to a tensor, then
# normalise the single channel with mean 0.5 and std 0.5.
transform = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.Normalize(mean=(0.5,), std=(0.5,)),
    ]
)

# Training split (downloaded into ./data if missing), served in shuffled
# mini-batches of 64.
trainset = torchvision.datasets.MNIST(
    root='./data',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(
    dataset=trainset,
    batch_size=64,
    shuffle=True,
)

# Held-out test split, served in its stored order with the same batch size.
testset = torchvision.datasets.MNIST(
    root='./data',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(
    dataset=testset,
    batch_size=64,
    shuffle=False,
)

# Define the Neural Network
class ShallowNN(nn.Module):
    """Fully connected classifier with one hidden ReLU layer.

    The input is flattened (every dimension after the batch dimension is
    merged by ``nn.Flatten``), projected to a hidden layer, passed through
    ReLU and projected to one score per class. The output is raw logits;
    no softmax is applied here.

    Args:
        in_features: Number of values per sample after flattening.
            Defaults to ``28 * 28``.
        hidden_features: Width of the hidden layer. Defaults to ``128``.
        num_classes: Number of output logits. Defaults to ``10``.
    """

    def __init__(
        self,
        in_features: int = 28 * 28,
        hidden_features: int = 128,
        num_classes: int = 10,
    ) -> None:
        super().__init__()
        # Attribute names are kept as-is so existing state_dict keys
        # (fc1.*, fc2.*) remain valid.
        self.flatten = nn.Flatten()
        self.fc1 = nn.Linear(in_features, hidden_features)
        self.fc2 = nn.Linear(hidden_features, num_classes)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Return the class logits for a batch of inputs.

        Args:
            x: Batch whose per-sample element count equals ``in_features``.

        Returns:
            Tensor of shape ``(batch, num_classes)`` holding unnormalised
            scores.
        """
        x = self.flatten(x)
        x = torch.relu(self.fc1(x))
        return self.fc2(x)

# Build the model, the classification loss and the optimiser
criterion = nn.CrossEntropyLoss()
net = ShallowNN()
optimizer = optim.Adam(net.parameters(), lr=1e-3)

# Optimise for 10 full passes over the training loader
for epoch in range(10):
    running_loss = 0.0  # loss accumulated since the last report
    for i, (inputs, labels) in enumerate(trainloader):
        # Forward pass and loss for this mini-batch
        outputs = net(inputs)
        loss = criterion(outputs, labels)

        # Clear old gradients, backpropagate, then apply the update
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
        if (i + 1) % 100 != 0:
            continue

        # Every 100th mini-batch: print the mean loss of the last 100 and reset
        print(f'[{epoch + 1}, {i + 1:5d}] loss: {running_loss / 100:.3f}')
        running_loss = 0.0

print('Finished Training')

# Measure classification accuracy on the test loader
total = 0
correct = 0
with torch.no_grad():  # no gradients are needed while scoring
    for images, labels in testloader:
        outputs = net(images)
        # The predicted class is the index of the largest logit in each row
        predicted = outputs.argmax(dim=1)
        total += labels.size(0)
        correct += torch.eq(predicted, labels).sum().item()

print(f'Accuracy of the network on the 10000 test images: {100 * correct // total} %')

[1,   100] loss: 0.926
[1,   200] loss: 0.422
[1,   300] loss: 0.355
[1,   400] loss: 0.353
[1,   500] loss: 0.349
[1,   600] loss: 0.314
[1,   700] loss: 0.299
[1,   800] loss: 0.281
[1,   900] loss: 0.257
[2,   100] loss: 0.229
[2,   200] loss: 0.232
[2,   300] loss: 0.218
[2,   400] loss: 0.214
[2,   500] loss: 0.188
[2,   600] loss: 0.214
[2,   700] loss: 0.182
[2,   800] loss: 0.183
[2,   900] loss: 0.190
[3,   100] loss: 0.173
[3,   200] loss: 0.152
[3,   300] loss: 0.162
[3,   400] loss: 0.136
[3,   500] loss: 0.140
[3,   600] loss: 0.160
[3,   700] loss: 0.150
[3,   800] loss: 0.128
[3,   900] loss: 0.135
[4,   100] loss: 0.117
[4,   200] loss: 0.123
[4,   300] loss: 0.111
[4,   400] loss: 0.121
[4,   500] loss: 0.114
[4,   600] loss: 0.121
[4,   700] loss: 0.121
[4,   800] loss: 0.106
[4,   900] loss: 0.120
[5,   100] loss: 0.096
[5,   200] loss: 0.097
[5,   300] loss: 0.110
[5,   400] loss: 0.104
[5,   500] loss: 0.100
[5,   600] loss: 0.093
[5,   700] loss: 0.101
[5,   800] 