<a href="https://colab.research.google.com/github/Ankitkumar1015/pre-trained-models/blob/main/resnet_kaggle_gender.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
import torch
import torchvision.transforms as transforms
import torchvision.datasets as datasets
from torch.utils.data import DataLoader
import torch.nn as nn
import torchvision.models as models
from torch.optim import lr_scheduler
import torch.optim as optim
import time

In [None]:
# Seed torch's global random number generator so that runs started from a
# fresh kernel draw the same random numbers from it (new layer initialisation,
# DataLoader shuffling). Bit-exact GPU results are not guaranteed by this alone.
SEED = 42
torch.manual_seed(SEED)

# Use the GPU when one is available, otherwise fall back to the CPU
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")


In [None]:
# Preprocessing pipelines for the train and test images.
# Both pipelines share the same geometric stage and the same tensor conversion /
# normalisation stage; only the training pipeline adds a random horizontal flip.
resize_and_crop = [
    transforms.Resize(256),
    transforms.CenterCrop(224),
]

# Per-channel statistics; presumably the ImageNet values expected by the
# pretrained backbone -- confirm against the weights' documentation.
to_normalized_tensor = [
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
]

augmentation = [transforms.RandomHorizontalFlip()]  # Data augmentation (train only)

train_transforms = transforms.Compose(resize_and_crop + augmentation + to_normalized_tensor)
test_transforms = transforms.Compose(resize_and_crop + to_normalized_tensor)


In [None]:
# Build the train and test datasets from the 'train' and 'test' sub-folders
# of the data directory, each with its own preprocessing pipeline.
data_dir = '/content/drive/MyDrive/Ml/gender kaggle - Copy'  # Example path from Google Drive
train_dataset = datasets.ImageFolder(data_dir + '/train', transform=train_transforms)
test_dataset = datasets.ImageFolder(data_dir + '/test', transform=test_transforms)


In [None]:
# Wrap both datasets in batched loaders; only the training data is shuffled
BATCH_SIZE = 32
train_loader = DataLoader(dataset=train_dataset, batch_size=BATCH_SIZE, shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=BATCH_SIZE, shuffle=False)


In [None]:
# Load a ResNet-18 initialised from its pretrained checkpoint.
# The boolean `pretrained` flag is deprecated in newer torchvision releases in
# favour of the `weights` enum, so use the enum when this torchvision provides
# it and keep the legacy flag as a fallback for older installations.
# IMAGENET1K_V1 is the checkpoint the legacy flag resolves to.
if hasattr(models, 'ResNet18_Weights'):
    model = models.resnet18(weights=models.ResNet18_Weights.IMAGENET1K_V1)
else:
    model = models.resnet18(pretrained=True)


Downloading: "https://download.pytorch.org/models/resnet18-f37072fd.pth" to /root/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth
100%|██████████| 44.7M/44.7M [00:01<00:00, 25.7MB/s]


In [None]:
# Swap the final fully connected layer for a two-output head (male / female),
# then move the whole network to the selected device.
num_ftrs = model.fc.in_features  # input width of the existing head
model.fc = nn.Linear(in_features=num_ftrs, out_features=2)
model = model.to(device)

In [None]:
# Cross-entropy objective, minimised with SGD plus momentum over all model parameters
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(
    params=model.parameters(),
    lr=1e-3,
    momentum=0.9,
)


In [None]:
# Multiply the learning rate by 0.1 after every 7 scheduler steps
scheduler = lr_scheduler.StepLR(optimizer=optimizer, gamma=0.1, step_size=7)

In [None]:
# Training loop
def train_model(model, criterion, optimizer, scheduler, num_epochs=10,
                dataloaders=None, device=None):
    """Train ``model`` and print loss / accuracy for every epoch.

    Each epoch runs a 'train' phase (forward pass, backward pass and optimizer
    step per batch) followed by a 'val' phase (forward pass only, gradients
    disabled). ``scheduler.step()`` is called once after each 'train' phase.

    Args:
        model: Network to optimise; its parameters are updated in place.
        criterion: Loss callable invoked as ``criterion(outputs, labels)``.
            The running loss is weighted by batch size, which assumes the
            criterion returns a per-batch mean.
        optimizer: Optimizer holding the parameters to update.
        scheduler: Learning-rate scheduler, stepped once per epoch.
        num_epochs: Number of train + val passes to run.
        dataloaders: Optional mapping with 'train' and 'val' keys whose values
            yield ``(inputs, labels)`` batches. When omitted, the notebook-level
            ``train_loader`` and ``test_loader`` are used. Note that this
            default validates on ``test_loader``, so the printed 'val' metrics
            are measured on the same data as a later test-set evaluation.
        device: Optional device the batches are moved to. When omitted, the
            device of the model's first parameter is used (CPU for a model
            without parameters).

    Returns:
        None. Progress is reported through ``print``.

    Raises:
        ValueError: If a phase's data loader yields no samples.
    """
    since = time.time()

    if dataloaders is None:
        # Backward-compatible default: the loaders created earlier in the notebook.
        dataloaders = {'train': train_loader, 'val': test_loader}
    if device is None:
        # Batches must live on the same device as the model's weights.
        first_param = next(model.parameters(), None)
        device = first_param.device if first_param is not None else torch.device('cpu')

    for epoch in range(num_epochs):
        print(f'Epoch {epoch+1}/{num_epochs}')
        print('-' * 10)

        # Each epoch has a training and evaluation phase
        for phase in ('train', 'val'):
            is_train = phase == 'train'
            if is_train:
                model.train()  # Set model to training mode
            else:
                model.eval()   # Set model to evaluate mode
            dataloader = dataloaders[phase]

            running_loss = 0.0
            running_corrects = 0
            num_samples = 0

            # Iterate over data
            for inputs, labels in dataloader:
                inputs = inputs.to(device)
                labels = labels.to(device)
                batch_size = inputs.size(0)

                # Gradients are only produced (and so only need resetting) when training
                if is_train:
                    optimizer.zero_grad()

                # Forward pass; autograd is recorded only in the training phase
                with torch.set_grad_enabled(is_train):
                    outputs = model(inputs)
                    _, preds = torch.max(outputs, 1)
                    loss = criterion(outputs, labels)

                    # Backward pass + optimize only if in training phase
                    if is_train:
                        loss.backward()
                        optimizer.step()

                # Track loss and accuracy as plain Python numbers
                running_loss += loss.item() * batch_size
                running_corrects += (preds == labels).sum().item()
                num_samples += batch_size

            if num_samples == 0:
                raise ValueError(f"The '{phase}' data loader yielded no samples")

            # Update learning rate scheduler
            if is_train:
                scheduler.step()

            # Average over the samples actually processed, which stays correct
            # even if the loader drops or subsamples part of its dataset.
            epoch_loss = running_loss / num_samples
            epoch_acc = running_corrects / num_samples

            print(f'{phase} Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')

    time_elapsed = time.time() - since
    # Round once before splitting so the seconds field can never print as "60s"
    minutes, seconds = divmod(round(time_elapsed), 60)
    print(f'Training complete in {minutes:.0f}m {seconds:.0f}s')

# Run training for ten epochs with the objects configured above
train_model(
    model=model,
    criterion=criterion,
    optimizer=optimizer,
    scheduler=scheduler,
    num_epochs=10,
)


Epoch 1/10
----------
train Loss: 0.2783 Acc: 0.8857
val Loss: 0.2856 Acc: 0.8750
Epoch 2/10
----------
train Loss: 0.1347 Acc: 0.9573
val Loss: 0.2215 Acc: 0.8917
Epoch 3/10
----------
train Loss: 0.0866 Acc: 0.9718
val Loss: 0.2032 Acc: 0.9250
Epoch 4/10
----------
train Loss: 0.0793 Acc: 0.9761
val Loss: 0.1712 Acc: 0.9417
Epoch 5/10
----------
train Loss: 0.0358 Acc: 0.9923
val Loss: 0.1659 Acc: 0.9333
Epoch 6/10
----------
train Loss: 0.0300 Acc: 0.9949
val Loss: 0.1612 Acc: 0.9333
Epoch 7/10
----------
train Loss: 0.0259 Acc: 0.9957
val Loss: 0.1573 Acc: 0.9417
Epoch 8/10
----------
train Loss: 0.0188 Acc: 0.9974
val Loss: 0.1543 Acc: 0.9417
Epoch 9/10
----------
train Loss: 0.0167 Acc: 0.9983
val Loss: 0.1458 Acc: 0.9417
Epoch 10/10
----------
train Loss: 0.0202 Acc: 0.9983
val Loss: 0.1426 Acc: 0.9500
Training complete in 67m 3s


In [None]:
# Measure classification accuracy over the whole test loader
model.eval()  # switch the network to evaluation mode

total = 0
correct = 0

# Gradients are not needed for evaluation, so disable autograd tracking
with torch.no_grad():
    for images, labels in test_loader:
        images = images.to(device)
        labels = labels.to(device)

        # Forward pass; the predicted class is the index of the largest output
        outputs = model(images)
        predicted = torch.max(outputs.data, 1)[1]

        correct += (predicted == labels).sum().item()
        total += labels.size(0)

# Express the hit rate as a percentage
accuracy = 100 * correct / total
print(f'Test Accuracy: {accuracy:.2f}%')

Test Accuracy: 95.00%
