In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader
from torchvision import datasets, transforms
from tqdm.notebook import tqdm

#Loading Data

In [2]:
# Define the transformation for the MNIST dataset
transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])

# Load the MNIST dataset
train_dataset = datasets.MNIST(root='./data', train=True, transform=transform, download=True)
test_dataset = datasets.MNIST(root='./data', train=False, transform=transform, download=True)

# Create data loaders
train_loader = DataLoader(dataset=train_dataset, batch_size=64, shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=64, shuffle=False)



Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz to ./data/MNIST/raw/train-images-idx3-ubyte.gz


100%|██████████| 9912422/9912422 [00:00<00:00, 106898495.72it/s]


Extracting ./data/MNIST/raw/train-images-idx3-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz to ./data/MNIST/raw/train-labels-idx1-ubyte.gz


100%|██████████| 28881/28881 [00:00<00:00, 21944872.07it/s]


Extracting ./data/MNIST/raw/train-labels-idx1-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz to ./data/MNIST/raw/t10k-images-idx3-ubyte.gz


100%|██████████| 1648877/1648877 [00:00<00:00, 16863256.73it/s]


Extracting ./data/MNIST/raw/t10k-images-idx3-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz to ./data/MNIST/raw/t10k-labels-idx1-ubyte.gz


100%|██████████| 4542/4542 [00:00<00:00, 18899334.10it/s]


Extracting ./data/MNIST/raw/t10k-labels-idx1-ubyte.gz to ./data/MNIST/raw



# Buliding Model

In [3]:
class Model(nn.Module):
    def __init__(self, input_size, hidden1_size, hidden2_size, output_size):
        super(Model, self).__init__()
        self.flatten = nn.Flatten()
        self.fc1 = nn.Linear(input_size, hidden1_size)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(hidden1_size, hidden2_size)
        self.fc3 = nn.Linear(hidden2_size, output_size)

    def forward(self, x):
        x = self.flatten(x)
        x = self.relu(self.fc1(x))
        x = self.relu(self.fc2(x))
        x = self.fc3(x)
        return x

## Training

In [6]:
input_size = 28 * 28
hidden1_size = 128
hidden2_size = 64
output_size = 10
lr = 0.01

# Instantiate the model, loss function, and optimizer
model = Model(input_size, hidden1_size, hidden2_size, output_size)
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(model.parameters(), lr=lr)


# Training loop
epochs = 10
for epoch in range(epochs):
    total_loss = 0.0
    correct_predictions = 0
    total_samples = 0

    for images, targets in tqdm(train_loader):
        images = images.to(torch.float32)
        targets = targets.to(torch.long)
        optimizer.zero_grad()  # Zero the gradients
        output = model(images)  # Forward pass
        loss = criterion(output, targets)  # Compute the loss
        loss.backward()  # Backward pass
        optimizer.step()  # Update weights

        total_loss += loss.item()

        _, predicted = torch.max(output, 1)
        correct_predictions += (predicted == targets).sum().item()
        total_samples += targets.size(0)

    # Calculate accuracy
    accuracy = correct_predictions / total_samples

    # Print epoch statistics
    print(f"Epoch {epoch + 1}/{epochs}, Loss: {total_loss / len(train_loader)}, Accuracy: {accuracy * 100:.2f}%")

  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 1/10, Loss: 0.9790819118272013, Accuracy: 74.45%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 2/10, Loss: 0.37750387390348705, Accuracy: 89.09%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 3/10, Loss: 0.32293653594596045, Accuracy: 90.62%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 4/10, Loss: 0.2928359089041951, Accuracy: 91.40%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 5/10, Loss: 0.2690679029281587, Accuracy: 92.12%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 6/10, Loss: 0.248391685610228, Accuracy: 92.75%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 7/10, Loss: 0.22865702556188044, Accuracy: 93.32%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 8/10, Loss: 0.21032664741772705, Accuracy: 93.84%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 9/10, Loss: 0.19453183817726843, Accuracy: 94.36%


  0%|          | 0/938 [00:00<?, ?it/s]

Epoch 10/10, Loss: 0.18080969984486286, Accuracy: 94.74%
