In [6]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision.transforms as transforms
import torchvision.datasets as datasets
from torch.utils.data import DataLoader
from torchvision import models
import torchvision


In [10]:
# Seed PyTorch's global RNG so repeated runs start from the same random state
torch.manual_seed(1)

# Hyperparameters and dataset constants
NUM_CLASSES = 37  # OxfordIIITPet dataset has 37 classes
BATCH_SIZE = 128
LEARNING_RATE = 0.0001
NUM_EPOCHS = 15

# Per-channel (mean, std) values handed to Normalize below
NORM_MEAN = (0.4904, 0.4550, 0.3984)
NORM_STD = (0.2630, 0.2585, 0.2665)

# Preprocessing pipeline applied to every image:
# fixed 224x224 resize -> tensor conversion -> per-channel normalization
transform = transforms.Compose(
    [
        transforms.Resize((224, 224)),
        transforms.ToTensor(),
        transforms.Normalize(NORM_MEAN, NORM_STD),
    ]
)

# Both OxfordIIITPet splits share the same root directory, download flag and
# preprocessing; only the split name differs.
_pet_dataset_kwargs = dict(root='/shareddata', download=True, transform=transform)
train_dataset = torchvision.datasets.OxfordIIITPet(split='trainval', **_pet_dataset_kwargs)
test_set = torchvision.datasets.OxfordIIITPet(split='test', **_pet_dataset_kwargs)

# Batch iterators: the training loader shuffles and uses 4 worker processes,
# the test loader keeps dataset order and the DataLoader default for workers.
train_loader = DataLoader(
    train_dataset,
    batch_size=BATCH_SIZE,
    shuffle=True,
    num_workers=4,
)
test_loader = DataLoader(dataset=test_set, batch_size=BATCH_SIZE, shuffle=False)

# Use the first CUDA device when one is available, otherwise the CPU
if torch.cuda.is_available():
    device = torch.device("cuda:0")
else:
    device = torch.device("cpu")

# Define ResNet model
class ResNetModel(nn.Module):
    """ResNet-18 backbone whose final fully connected layer is replaced.

    The backbone is created with pretrained weights and its ``fc`` layer is
    swapped for a fresh ``nn.Linear`` producing ``num_classes`` outputs.

    Args:
        num_classes: Number of output units of the replacement ``fc`` layer.
    """

    def __init__(self, num_classes):
        super().__init__()
        # torchvision 0.13 deprecated `pretrained=True` in favour of the
        # `weights` argument; IMAGENET1K_V1 is the checkpoint the legacy flag
        # maps to. Older releases have no weights enum, so fall back to the
        # legacy flag there.
        weights_enum = getattr(models, "ResNet18_Weights", None)
        if weights_enum is not None:
            self.resnet = models.resnet18(weights=weights_enum.IMAGENET1K_V1)
        else:
            self.resnet = models.resnet18(pretrained=True)

        # Keep the backbone's feature width, change only the output size.
        in_features = self.resnet.fc.in_features
        self.resnet.fc = nn.Linear(in_features, num_classes)

    def forward(self, x):
        """Run ``x`` through the wrapped ResNet and return its output."""
        return self.resnet(x)

# Build the network, then place it on the selected device
model = ResNetModel(num_classes=NUM_CLASSES)
model = model.to(device)

# Cross-entropy objective; Adam updates every parameter of the model
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=LEARNING_RATE)

# Training: NUM_EPOCHS full passes over train_loader
for epoch in range(NUM_EPOCHS):
    # Put the model in training mode at the start of every epoch
    model.train()

    for batch_idx, batch in enumerate(train_loader):
        # Each batch is an (inputs, labels) pair; move both to the device
        data, target = batch
        data = data.to(device)
        target = target.to(device)

        # One optimization step: reset grads, forward, loss, backward, update
        optimizer.zero_grad()
        output = model(data)
        loss = criterion(output, target)
        loss.backward()
        optimizer.step()

        # Progress is reported only on every 100th batch (batch 0 included)
        if batch_idx % 100 != 0:
            continue
        print(f"Epoch {epoch+1}/{NUM_EPOCHS}, Batch {batch_idx}/{len(train_loader)}, Loss: {loss.item():.4f}")

# Evaluation: fraction of test_loader samples whose top-scoring class
# matches the label.
model.eval()  # switch the model to evaluation mode
correct = 0
total = 0

# Gradients are not needed for scoring, so disable autograd tracking.
with torch.no_grad():
    for data, target in test_loader:
        data, target = data.to(device), target.to(device)
        outputs = model(data)
        # Index of the largest score along the class dimension. argmax replaces
        # torch.max(outputs.data, 1): the legacy `.data` access is redundant
        # under no_grad, and the throwaway `_` binding is avoided because in
        # IPython it shadows the last-output variable.
        predicted = outputs.argmax(dim=1)
        total += target.size(0)
        correct += (predicted == target).sum().item()

accuracy = correct / total
print(f"Test Accuracy: {accuracy * 100:.2f}%")


Epoch 1/15, Batch 0/29, Loss: 3.8062
Epoch 2/15, Batch 0/29, Loss: 1.0034
Epoch 3/15, Batch 0/29, Loss: 0.4653
Epoch 4/15, Batch 0/29, Loss: 0.1932
Epoch 5/15, Batch 0/29, Loss: 0.0896
Epoch 6/15, Batch 0/29, Loss: 0.0557
Epoch 7/15, Batch 0/29, Loss: 0.0370
Epoch 8/15, Batch 0/29, Loss: 0.0273
Epoch 9/15, Batch 0/29, Loss: 0.0201
Epoch 10/15, Batch 0/29, Loss: 0.0152
Epoch 11/15, Batch 0/29, Loss: 0.0134
Epoch 12/15, Batch 0/29, Loss: 0.0109
Epoch 13/15, Batch 0/29, Loss: 0.0091
Epoch 14/15, Batch 0/29, Loss: 0.0092
Epoch 15/15, Batch 0/29, Loss: 0.0074
Test Accuracy: 87.95%
