In [None]:
import torch
import torchvision
import torchvision.transforms as transforms
import torch.nn as nn
import torch.optim as optim
from torchvision.models import vgg16

# Define transforms for the dataset.
# SVHN images are 3-channel RGB and the model below starts from ImageNet
# pre-trained weights, so normalize each channel with the ImageNet mean/std
# that those weights were trained with.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.485, 0.456, 0.406),
                         std=(0.229, 0.224, 0.225)),
])

# Load the SVHN dataset (files are downloaded into ./data when missing)
train_dataset = torchvision.datasets.SVHN(root='./data', split='train', transform=transform, download=True)
test_dataset = torchvision.datasets.SVHN(root='./data', split='test', transform=transform, download=True)

# Define data loaders; only the training split is shuffled
train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=32, shuffle=True)
test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=32, shuffle=False)

# Start from VGG16 initialised with its pre-trained weights
model = vgg16(pretrained=True)

# Freeze the convolutional feature extractor (optional)
model.features.requires_grad_(False)

# Replace the final classifier layer with a 10-way output:
# SVHN has 10 classes (digits 0-9)
num_classes = 10
model.classifier[6] = nn.Linear(model.classifier[6].in_features, num_classes)

# Cross-entropy loss, minimised with SGD plus momentum
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(model.parameters(), lr=0.001, momentum=0.9)

# Train the model
num_epochs = 5
# Run on the first CUDA device when one is available, otherwise on the CPU
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model.to(device)

for epoch in range(num_epochs):
    running_loss = 0.0
    # Count mini-batches from 1 so the counter matches the printed step
    for step, (inputs, labels) in enumerate(train_loader, start=1):
        inputs = inputs.to(device)
        labels = labels.to(device)

        # One optimisation step: reset gradients, forward, backward, update
        optimizer.zero_grad()
        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
        if step % 100 == 0:
            # Report the mean loss over the last 100 mini-batches
            print('[%d, %5d] loss: %.3f' %
                  (epoch + 1, step, running_loss / 100))
            running_loss = 0.0

print('Finished Training')

# Evaluate the model
# Switch to evaluation mode first: VGG16's classifier contains Dropout layers,
# which would otherwise keep randomly zeroing activations at test time and
# make the reported accuracy noisy and too low.
model.eval()

correct = 0
total = 0
with torch.no_grad():  # gradients are not needed for inference
    for data in test_loader:
        images, labels = data[0].to(device), data[1].to(device)
        outputs = model(images)
        # The predicted class is the index of the largest logit per sample
        _, predicted = torch.max(outputs, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

# Report the number of images actually evaluated rather than a fixed count
print('Accuracy of the network on the %d test images: %d %%' % (
    total, 100 * correct / total))


Using downloaded and verified file: ./data/train_32x32.mat
Using downloaded and verified file: ./data/test_32x32.mat




[1,   100] loss: 2.108
[1,   200] loss: 1.866
[1,   300] loss: 1.836
[1,   400] loss: 1.798
[1,   500] loss: 1.787
[1,   600] loss: 1.758
[1,   700] loss: 1.733
[1,   800] loss: 1.731
[1,   900] loss: 1.705
[1,  1000] loss: 1.660
[1,  1100] loss: 1.674
[1,  1200] loss: 1.642
[1,  1300] loss: 1.665
[1,  1400] loss: 1.614
[1,  1500] loss: 1.602
[1,  1600] loss: 1.613
[1,  1700] loss: 1.592
[1,  1800] loss: 1.618
[1,  1900] loss: 1.648
