Question 1

Complete PyTorch Program (MLP for Handwritten Digit Classification)

In [2]:
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader

# 1️⃣ Device: run on the GPU when CUDA is available, otherwise on the CPU
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

# 2️⃣ Data Preprocessing: image -> tensor in [0, 1] -> (x - 0.5) / 0.5, i.e. [-1, 1]
to_tensor = transforms.ToTensor()
normalize = transforms.Normalize(mean=(0.5,), std=(0.5,))
transform = transforms.Compose([to_tensor, normalize])

# 3️⃣ Handwritten Digit Dataset (MNIST): train and test splits share the same
#    storage folder and preprocessing; files are fetched if not already present
mnist_kwargs = dict(root='./data', transform=transform, download=True)
train_dataset = datasets.MNIST(train=True, **mnist_kwargs)
test_dataset = datasets.MNIST(train=False, **mnist_kwargs)

# Mini-batches of 64 samples; only the training split is shuffled
batch_size = 64
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

# 4️⃣ Define Feed-Forward Neural Network (MLP)
class MLP(nn.Module):
    """Feed-forward classifier for 28x28 digit images.

    Architecture: Linear(784 -> 128) -> ReLU -> Linear(128 -> 10).
    The network returns raw class scores (logits); no softmax is applied.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(28 * 28, 128)  # Input layer
        self.relu = nn.ReLU()              # Activation
        self.fc2 = nn.Linear(128, 10)      # Output layer (10 digits)

    def forward(self, x):
        """Compute class logits.

        Args:
            x: Either features whose last dimension is already 784
               (e.g. ``(batch, 784)``), or image-shaped input such as
               ``(batch, 1, 28, 28)``, which is flattened per sample here.

        Returns:
            Tensor with 10 logits per sample.
        """
        # Anything the first linear layer can consume directly is passed through
        # untouched; only multi-dimensional input with a non-matching trailing
        # dimension (i.e. un-flattened images) is collapsed to (batch, features).
        if x.dim() > 2 and x.size(-1) != self.fc1.in_features:
            x = x.flatten(start_dim=1)

        x = self.fc1(x)
        x = self.relu(x)
        x = self.fc2(x)
        return x

# 5️⃣ Initialize Model, Loss, Optimizer
# Seed PyTorch's global RNG before anything random happens, so that the weight
# initialisation and the DataLoader's shuffle order repeat on every
# "Restart Kernel -> Run All". (Some CUDA kernels are non-deterministic, so GPU
# runs may still differ slightly.)
SEED = 42
torch.manual_seed(SEED)

model = MLP().to(device)
criterion = nn.CrossEntropyLoss()                     # takes raw logits + integer class labels
optimizer = optim.Adam(model.parameters(), lr=0.001)

# 6️⃣ Training Loop
num_epochs = 5

for epoch in range(num_epochs):
    model.train()
    total_loss = 0

    for images, labels in train_loader:
        # Flatten images (28x28 → 784)
        images = images.view(images.size(0), -1).to(device)
        labels = labels.to(device)

        outputs = model(images)
        loss = criterion(outputs, labels)

        # Gradients accumulate by default, so clear them before each backward pass
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        total_loss += loss.item()

    # Reported value is the mean of the per-batch mean losses for this epoch
    print(f"Epoch [{epoch+1}/{num_epochs}], Loss: {total_loss/len(train_loader):.4f}")

# 7️⃣ Model Evaluation (Accuracy)
model.eval()   # switch the module to evaluation mode
correct = 0
total = 0

with torch.no_grad():   # scoring only: no gradient tracking needed
    for images, labels in test_loader:
        images = images.view(images.size(0), -1).to(device)
        labels = labels.to(device)

        outputs = model(images)
        # Predicted class = index of the largest logit. argmax replaces
        # `_, predicted = torch.max(outputs, 1)` so the cell no longer rebinds
        # `_`, which IPython/Jupyter uses for the last cell output.
        predicted = outputs.argmax(dim=1)

        total += labels.size(0)
        correct += (predicted == labels).sum().item()

accuracy = 100 * correct / total
print(f"Test Accuracy: {accuracy:.2f}%")

Epoch [1/5], Loss: 0.3828
Epoch [2/5], Loss: 0.2009
Epoch [3/5], Loss: 0.1410
Epoch [4/5], Loss: 0.1124
Epoch [5/5], Loss: 0.0933
Test Accuracy: 96.28%


Question 2

Neural Network Design (MLP in PyTorch)

In [3]:
import torch
import torch.nn as nn

# Define the neural network by inheriting from nn.Module
class DigitMLP(nn.Module):
    """Single-hidden-layer MLP: Linear -> ReLU -> Linear.

    The network returns raw class scores (logits); no softmax is applied.

    Args:
        input_size: Number of features per sample (default 784).
        hidden_size: Width of the hidden layer (default 128).
        num_classes: Number of output logits (default 10).
    """

    def __init__(self, input_size=784, hidden_size=128, num_classes=10):
        super().__init__()

        # Input layer -> Hidden layer
        self.fc1 = nn.Linear(input_size, hidden_size)

        # Activation function
        self.relu = nn.ReLU()

        # Hidden layer -> Output layer
        self.fc2 = nn.Linear(hidden_size, num_classes)

    # Manually implement forward pass
    def forward(self, x):
        """Compute class logits.

        Args:
            x: Either features whose last dimension already equals
               ``input_size`` (e.g. ``(batch, input_size)``), or
               multi-dimensional input such as ``(batch, 1, 28, 28)``,
               which is flattened per sample here.

        Returns:
            Tensor with ``num_classes`` logits per sample.
        """
        # Input the first linear layer can consume directly is passed through
        # untouched; only multi-dimensional input with a non-matching trailing
        # dimension (e.g. un-flattened images) is collapsed to (batch, features).
        if x.dim() > 2 and x.size(-1) != self.fc1.in_features:
            x = x.flatten(start_dim=1)

        x = self.fc1(x)    # Linear transformation (input -> hidden)
        x = self.relu(x)   # ReLU activation
        x = self.fc2(x)    # Linear transformation (hidden -> output)
        return x

# Example: create a model instance with the default sizes
# (input_size=784, hidden_size=128, num_classes=10); printing an nn.Module
# lists its registered sub-layers.
model = DigitMLP()
print(model)

DigitMLP(
  (fc1): Linear(in_features=784, out_features=128, bias=True)
  (relu): ReLU()
  (fc2): Linear(in_features=128, out_features=10, bias=True)
)


Question 3

Training & Evaluation Code (PyTorch)

In [4]:
import torch
import torch.nn as nn
import torch.optim as optim

# Relies on `model`, `train_loader` and `test_loader` created by earlier cells
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")
model = model.to(device)

# 1️⃣ Loss Function & Optimizer
# Multi-class cross-entropy, minimised with Adam
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

# (Optional) drop-in SGD alternative:
# optimizer = optim.SGD(model.parameters(), lr=0.01, momentum=0.9)

# 2️⃣ Training Loop
num_epochs = 5

for epoch in range(num_epochs):
    model.train()   # training mode
    running_loss = 0.0

    for images, labels in train_loader:
        # Move the batch to the training device, then collapse every image
        # into a single feature vector: (batch, 1, 28, 28) → (batch, 784)
        labels = labels.to(device)
        images = images.to(device)
        images = images.view(images.size(0), -1)

        # Clear gradients left over from the previous step
        optimizer.zero_grad()

        # Forward pass, loss, backward pass, parameter update
        outputs = model(images)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()

    # Mean of the per-batch losses seen during this epoch
    avg_loss = running_loss / len(train_loader)
    print(f"Epoch [{epoch+1}/{num_epochs}], Training Loss: {avg_loss:.4f}")

# 3️⃣ Evaluation on Test Dataset
model.eval()   # Set model to evaluation mode
correct = 0
total = 0

with torch.no_grad():   # scoring only: no gradient tracking needed
    for images, labels in test_loader:
        images = images.view(images.size(0), -1).to(device)
        labels = labels.to(device)

        outputs = model(images)
        # Predicted class = index of the largest logit. argmax replaces
        # `_, predicted = torch.max(outputs, 1)` so the cell no longer rebinds
        # `_`, which IPython/Jupyter uses for the last cell output.
        predicted = outputs.argmax(dim=1)

        total += labels.size(0)
        correct += (predicted == labels).sum().item()

accuracy = 100 * correct / total
print(f"\n✅ Test Classification Accuracy: {accuracy:.2f}%")

Epoch [1/5], Training Loss: 0.3834
Epoch [2/5], Training Loss: 0.2032
Epoch [3/5], Training Loss: 0.1436
Epoch [4/5], Training Loss: 0.1139
Epoch [5/5], Training Loss: 0.0968

✅ Test Classification Accuracy: 96.61%
