In [4]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms

In [6]:
# Define the neural network architecture
class SimpleNN(nn.Module):
    """Fully connected classifier with two ReLU-activated hidden layers.

    The default sizes (784 inputs, 64 hidden units, 10 outputs) build exactly
    the same three ``nn.Linear`` layers as the previous hard-coded version, so
    ``SimpleNN()`` keeps working unchanged.

    Args:
        input_size: Number of features in each (already flattened) sample.
        hidden_size: Width shared by both hidden layers.
        num_classes: Number of scores produced for each sample.
    """

    def __init__(self, input_size: int = 784, hidden_size: int = 64, num_classes: int = 10):
        super().__init__()
        self.fc1 = nn.Linear(input_size, hidden_size)   # input features -> first hidden layer
        self.fc2 = nn.Linear(hidden_size, hidden_size)  # first hidden -> second hidden layer
        self.fc3 = nn.Linear(hidden_size, num_classes)  # second hidden -> one score per class

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Compute raw class scores for ``x``.

        Args:
            x: Tensor whose last dimension equals ``input_size``; callers are
                responsible for flattening images before passing them in.

        Returns:
            Tensor whose last dimension equals ``num_classes``. No activation
            is applied to the final layer, so the values are unnormalised.
        """
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        return self.fc3(x)

In [7]:
# Load and preprocess the data
# Every image is first converted to a tensor and then normalised with
# mean 0.5 and standard deviation 0.5 (one value because there is one channel).
transform = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.Normalize((0.5,), (0.5,)),
    ]
)

# Training split: kept under ./data (fetched if missing), served in
# reshuffled mini-batches of 32.
trainset = torchvision.datasets.MNIST(
    root='./data',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(
    trainset,
    batch_size=32,
    shuffle=True,
)

# Test split: same preprocessing and batch size, but iterated in a fixed order.
testset = torchvision.datasets.MNIST(
    root='./data',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(
    testset,
    batch_size=32,
    shuffle=False,
)

In [8]:
# Initialize the model, loss function, and optimizer
# Seed PyTorch's global random number generator before anything random
# happens, so that the initial weights (and later draws from the same global
# generator) repeat when the notebook is restarted and run top to bottom.
SEED = 42
torch.manual_seed(SEED)

model = SimpleNN()
criterion = nn.CrossEntropyLoss()  # applied to the model's raw output scores
optimizer = optim.Adam(model.parameters(), lr=0.001)


In [9]:
# Training the model
# Makes 10 passes over trainloader. Within each pass the loss is summed and,
# on every 1000th mini-batch, its mean over those 1000 batches is printed and
# the sum is reset.
for epoch in range(10):
    running_loss = 0.0
    for i, (inputs, labels) in enumerate(trainloader):
        # Keep the batch dimension and collapse everything else into one axis
        inputs = inputs.view(inputs.size(0), -1)

        # Clear gradients left over from the previous step
        optimizer.zero_grad()

        # Forward pass, loss, backward pass, parameter update
        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
        if (i + 1) % 1000 != 0:
            continue  # not at a reporting boundary yet

        print(f'Epoch {epoch + 1}, Mini-batch {i + 1}: Loss {running_loss / 1000:.3f}')
        running_loss = 0.0

print('Finished Training')

Epoch 1, Mini-batch 1000: Loss 0.472
Epoch 2, Mini-batch 1000: Loss 0.199
Epoch 3, Mini-batch 1000: Loss 0.147
Epoch 4, Mini-batch 1000: Loss 0.118
Epoch 5, Mini-batch 1000: Loss 0.106
Epoch 6, Mini-batch 1000: Loss 0.095
Epoch 7, Mini-batch 1000: Loss 0.085
Epoch 8, Mini-batch 1000: Loss 0.073
Epoch 9, Mini-batch 1000: Loss 0.066
Epoch 10, Mini-batch 1000: Loss 0.063
Finished Training


In [None]:
# Testing the model
# Counts how many test samples receive the correct label and prints the
# resulting percentage.
correct = 0
total = 0

# Switch to evaluation mode for the measurement and put the model back into
# whatever mode it was in afterwards, so re-running other cells is unaffected.
was_training = model.training
model.eval()
try:
    with torch.no_grad():  # no gradients are needed for scoring
        for images, labels in testloader:
            images = images.view(images.size(0), -1)  # flatten each image
            outputs = model(images)
            # Index of the highest score per sample. A throwaway `_` is
            # deliberately not assigned: in IPython/Jupyter that name holds
            # the previous cell output.
            predicted = outputs.argmax(dim=1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()
finally:
    model.train(was_training)

# Report the number of images actually evaluated instead of a fixed count
print(f'Accuracy of the network on the {total} test images: {100 * correct / total}%')
