In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms

# Part 1: Data Loading and Preprocessing

# Download datasets (not necessary as we are using download=True in the next step)

# Preprocessing pipeline: turn each image into a tensor, then normalize its
# single channel with mean 0.5 and std 0.5.
to_tensor = transforms.ToTensor()
normalize = transforms.Normalize((0.5,), (0.5,))
transform = transforms.Compose([to_tensor, normalize])

# Fashion-MNIST train and test splits; both share the same storage root,
# download flag, and preprocessing pipeline.
dataset_kwargs = dict(root='./data', download=True, transform=transform)
trainset = torchvision.datasets.FashionMNIST(train=True, **dataset_kwargs)
testset = torchvision.datasets.FashionMNIST(train=False, **dataset_kwargs)

# Mini-batch loaders: the training split is shuffled, the test split keeps
# its stored order.
batch_size = 64
trainloader = torch.utils.data.DataLoader(trainset, batch_size=batch_size, shuffle=True)
testloader = torch.utils.data.DataLoader(testset, batch_size=batch_size, shuffle=False)



Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to ./data/FashionMNIST/raw/train-images-idx3-ubyte.gz


  0%|          | 0/26421880 [00:00<?, ?it/s]

Extracting ./data/FashionMNIST/raw/train-images-idx3-ubyte.gz to ./data/FashionMNIST/raw

Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to ./data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


  0%|          | 0/29515 [00:00<?, ?it/s]

Extracting ./data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to ./data/FashionMNIST/raw

Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to ./data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


  0%|          | 0/4422102 [00:00<?, ?it/s]

Extracting ./data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to ./data/FashionMNIST/raw

Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to ./data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz


  0%|          | 0/5148 [00:00<?, ?it/s]

Extracting ./data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to ./data/FashionMNIST/raw



In [2]:
# Part 2: Model Training

# Define the neural network model
class Net(nn.Module):
    """Fully connected classifier with two hidden ReLU layers.

    Every sample is flattened to a vector and passed through
    ``fc1 -> ReLU -> fc2 -> ReLU -> fc3``. The output is the raw score of
    ``fc3`` (no softmax is applied here).

    Args:
        in_features: Number of values per flattened sample (default 784).
        hidden1: Width of the first hidden layer (default 256).
        hidden2: Width of the second hidden layer (default 128).
        num_classes: Number of output scores per sample (default 10).
    """

    def __init__(self, in_features=784, hidden1=256, hidden2=128, num_classes=10):
        super().__init__()
        # Layers are created in the same order as before, so a given RNG seed
        # still yields the same initial weights with the default sizes.
        self.fc1 = nn.Linear(in_features, hidden1)
        self.fc2 = nn.Linear(hidden1, hidden2)
        self.fc3 = nn.Linear(hidden2, num_classes)

    def forward(self, x):
        """Return one row of ``num_classes`` raw scores per input sample.

        Args:
            x: Tensor whose first dimension is the batch; all remaining
                dimensions are flattened and must multiply to ``in_features``.

        Returns:
            Tensor of shape ``(batch, num_classes)``.
        """
        # flatten() falls back to a copy when the memory layout requires it,
        # whereas view() raises on non-contiguous input (e.g. after transpose).
        x = torch.flatten(x, start_dim=1)
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        return self.fc3(x)

# Seed the global RNG before the model is built so that weight initialization
# and the shuffled batch order repeat on every Restart & Run All.
# The value itself is arbitrary.
SEED = 0
torch.manual_seed(SEED)

# Create an instance of the model
net = Net()

# Define loss function and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=0.001, momentum=0.9)

NUM_EPOCHS = 10
LOG_EVERY = 200  # number of batches averaged into each printed loss

# Train the model
net.train()  # explicit, so re-running this cell after evaluation still trains in train mode
for epoch in range(NUM_EPOCHS):
    # The accumulator restarts every epoch, so batches after the last complete
    # LOG_EVERY window of an epoch are not part of any printed average.
    running_loss = 0.0
    for i, (inputs, labels) in enumerate(trainloader):
        optimizer.zero_grad()

        outputs = net(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
        if (i + 1) % LOG_EVERY == 0:
            print(f'Epoch: {epoch + 1}, Batch: {i + 1}, Loss: {running_loss / LOG_EVERY}')
            running_loss = 0.0

print('Training finished.')

Epoch: 1, Batch: 200, Loss: 1.8664700442552566
Epoch: 1, Batch: 400, Loss: 1.0202134603261948
Epoch: 1, Batch: 600, Loss: 0.7619134965538978
Epoch: 1, Batch: 800, Loss: 0.686231083869934
Epoch: 2, Batch: 200, Loss: 0.5972450044751167
Epoch: 2, Batch: 400, Loss: 0.5721162809431553
Epoch: 2, Batch: 600, Loss: 0.5493666070699692
Epoch: 2, Batch: 800, Loss: 0.5387066954374313
Epoch: 3, Batch: 200, Loss: 0.5125240416824818
Epoch: 3, Batch: 400, Loss: 0.4980582490563393
Epoch: 3, Batch: 600, Loss: 0.49226638868451117
Epoch: 3, Batch: 800, Loss: 0.46673306591808794
Epoch: 4, Batch: 200, Loss: 0.45489336386322976
Epoch: 4, Batch: 400, Loss: 0.45928189530968666
Epoch: 4, Batch: 600, Loss: 0.4463480018079281
Epoch: 4, Batch: 800, Loss: 0.44837641626596453
Epoch: 5, Batch: 200, Loss: 0.4347141572088003
Epoch: 5, Batch: 400, Loss: 0.4268411786854267
Epoch: 5, Batch: 600, Loss: 0.42268663972616194
Epoch: 5, Batch: 800, Loss: 0.42576565109193326
Epoch: 6, Batch: 200, Loss: 0.40933271549642086
Epoch:

In [3]:
# Part 3: Model Testing

# Switch to inference mode before scoring. This model has no dropout or
# batch-norm layers, but the switch keeps the cell correct if any are added.
net.eval()

correct = 0
total = 0
with torch.no_grad():  # no gradients are needed for evaluation
    for images, labels in testloader:
        outputs = net(images)
        # Index of the highest score in each row is the predicted class.
        predicted = outputs.argmax(dim=1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print(f'Accuracy on test set: {(100 * correct / total):.2f}%')


Accuracy on test set: 85.47%
