In [22]:
import torch
import torch.nn as nn
import torchvision.models as models
from torch.utils.data import DataLoader, random_split
from torchvision import transforms, datasets


In [23]:
from torchvision import datasets, transforms
from torch.utils.data import Dataset, DataLoader
import os
from PIL import Image
import tqdm


class CatNotCatDataset(Dataset):
    """Binary image dataset: label 1 for cat images, label 0 for everything else.

    Expected directory layout under ``root_dir``::

        root_dir/
            cat/                 <- images directly inside, label 1
            <any other dir>/     <- treated as "not cat"
                <sub_class>/     <- images inside each sub-directory, label 0

    Images placed directly inside a "not cat" directory (i.e. not in one of
    its sub-directories) are ignored, as are non-directory entries in
    ``root_dir``.
    """

    # Leading dots matter: without them a file called "fakejpg" would match.
    IMAGE_EXTENSIONS = ('.png', '.jpg', '.jpeg')

    def __init__(self, root_dir, transform=None):
        """
        Args:
            root_dir (string): Directory with all the animal subdirectories.
            transform (callable, optional): Optional transform to be applied on a sample.
        """
        self.root_dir = root_dir
        self.transform = transform
        self.samples = []

        # Directory listings are sorted so that sample indices are stable
        # across runs and platforms (os.listdir order is arbitrary).
        for sub_dir in sorted(os.listdir(root_dir)):
            class_path = os.path.join(root_dir, sub_dir)
            if not os.path.isdir(class_path):
                continue

            if sub_dir.lower() == 'cat':
                # Cat images live directly in the 'cat' directory.
                self.samples.extend(self._list_images(class_path, 1))
            else:
                # Every other directory is "not cat"; its images are one level deeper.
                for sub_class in sorted(os.listdir(class_path)):
                    sub_class_path = os.path.join(class_path, sub_class)
                    if os.path.isdir(sub_class_path):
                        self.samples.extend(self._list_images(sub_class_path, 0))

    @classmethod
    def _list_images(cls, folder, label):
        """Return sorted ``(path, label)`` pairs for the image files directly in ``folder``."""
        return [
            (os.path.join(folder, name), label)
            for name in sorted(os.listdir(folder))
            if name.lower().endswith(cls.IMAGE_EXTENSIONS)
        ]

    def __len__(self):
        """Number of image samples discovered under ``root_dir``."""
        return len(self.samples)

    def __getitem__(self, idx):
        """Load sample ``idx`` and return ``(image, label)``.

        The image is always converted to 3-channel RGB so that grayscale,
        palette and RGBA files are compatible with a 3-channel transform /
        model; ``transform`` (if any) is applied afterwards.
        """
        img_path, label = self.samples[idx]
        # The context manager closes the underlying file; convert() returns
        # a fully loaded copy that stays valid afterwards.
        with Image.open(img_path) as img:
            image = img.convert('RGB')
        if self.transform:
            image = self.transform(image)
        return image, label


In [24]:
# Preprocessing applied to every image: fixed 224x224 size, tensor conversion,
# then per-channel normalization with the ImageNet mean/std values.
transform = transforms.Compose([
    transforms.Resize((224, 224)),  # Resize images to 224x224
    transforms.ToTensor(),  # Convert images to PyTorch tensors
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),  # ImageNet normalization
])

dataset = CatNotCatDataset(root_dir='one_vs_rest', transform=transform)
if len(dataset) == 0:
    # Fail early with a clear message instead of an obscure sampler error later on.
    raise RuntimeError("No images found under 'one_vs_rest'; check the directory layout.")

# Splitting dataset into training (80%) and validation (remaining 20%) sets.
train_size = int(0.8 * len(dataset))
val_size = len(dataset) - train_size
# A seeded generator makes the train/validation partition identical on every run,
# so validation metrics are comparable between runs.
split_generator = torch.Generator().manual_seed(42)
train_dataset, val_dataset = random_split(
    dataset, [train_size, val_size], generator=split_generator
)

# Creating data loaders: shuffle only the training data.
train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)
val_loader = DataLoader(val_dataset, batch_size=32, shuffle=False)

In [25]:
import torch
import torch.nn as nn
import torch.nn.functional as F

class ResNet18CatNotCat(nn.Module):
    """ResNet-18 with ImageNet-pretrained weights and a replaced classification head.

    Args:
        num_classes (int): Number of output logits of the new final layer
            (default 2: cat / not cat).
    """

    def __init__(self, num_classes=2):
        super().__init__()
        # Load a pre-trained resnet model. Newer torchvision releases deprecate
        # ``pretrained=True`` in favour of the ``weights=`` enum; use the enum
        # when it exists and fall back to the legacy flag otherwise.
        weights_enum = getattr(models, "ResNet18_Weights", None)
        if weights_enum is not None:
            self.resnet18 = models.resnet18(weights=weights_enum.IMAGENET1K_V1)
        else:
            self.resnet18 = models.resnet18(pretrained=True)
        # Modify the final fully connected layer to match the number of classes
        num_ftrs = self.resnet18.fc.in_features
        self.resnet18.fc = nn.Linear(num_ftrs, num_classes)

    def forward(self, x):
        """Run ``x`` through the backbone and return the raw class logits."""
        return self.resnet18(x)


In [26]:
import matplotlib.pyplot as plt

def visualize_feature_maps(feature_maps):
    """Plot every channel of each feature map as a grayscale image grid.

    One figure is produced per entry of ``feature_maps``; channels are laid
    out eight per row and only the first item along dimension 0 is shown.

    Args:
        feature_maps: Iterable of tensors, assumed to come from convolutional
            layers with layout (batch, channels, height, width) -- TODO confirm
            against the caller.
    """
    n_cols = 8
    for layer, f_map in enumerate(feature_maps, start=1):  # Start layer indexing at 1
        channels = f_map.shape[1]
        # Ceiling division: exactly as many rows as needed (no spare empty row
        # when the channel count is a multiple of n_cols); at least one row.
        n_rows = max(1, -(-channels // n_cols))

        fig = plt.figure(figsize=(20, 15))
        fig.suptitle(f'Layer {layer}: {channels} feature maps')

        for i in range(channels):
            ax = fig.add_subplot(n_rows, n_cols, i + 1)  # Arrange plots in a grid
            ax.imshow(f_map[0, i].detach().cpu().numpy(), cmap='gray')
            ax.axis('off')

        plt.show()
        # Release the figure so repeated calls do not accumulate open figures.
        plt.close(fig)


In [27]:
def train_model(model, train_loader, val_loader, num_epochs=5):
    """Train ``model`` with Adam + cross-entropy and report metrics each epoch.

    After every epoch the model is evaluated on ``val_loader`` and one line
    with the training loss, validation loss and validation accuracy is
    printed. Losses are averaged per sample, so a smaller final batch does
    not skew the reported value. The model is trained in place; nothing is
    returned.

    Args:
        model: Module mapping a batch of images to class logits.
        train_loader: Iterable of ``(images, labels)`` training batches.
        val_loader: Iterable of ``(images, labels)`` validation batches.
        num_epochs (int): Number of passes over ``train_loader``.
    """
    # Use the GPU when one is available, otherwise fall back to the CPU.
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    model.to(device)
    criterion = nn.CrossEntropyLoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)

    for epoch in tqdm.tqdm(range(num_epochs)):
        # ---- training pass ----
        model.train()
        train_loss_sum = 0.0
        train_seen = 0
        for images, labels in tqdm.tqdm(train_loader):
            images, labels = images.to(device), labels.to(device)
            optimizer.zero_grad()

            outputs = model(images)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            # criterion returns the batch mean; weight it by the batch size so
            # the epoch figure is a true per-sample average.
            batch_size = labels.size(0)
            train_loss_sum += loss.item() * batch_size
            train_seen += batch_size

        # ---- validation pass (no gradients, eval-mode layers) ----
        model.eval()
        val_loss_sum = 0.0
        correct = 0
        total = 0
        with torch.no_grad():
            for images, labels in val_loader:
                images, labels = images.to(device), labels.to(device)
                outputs = model(images)
                loss = criterion(outputs, labels)
                val_loss_sum += loss.item() * labels.size(0)
                predicted = outputs.argmax(dim=1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()

        # Report NaN instead of raising ZeroDivisionError when a loader is empty.
        train_loss = train_loss_sum / train_seen if train_seen else float('nan')
        val_loss = val_loss_sum / total if total else float('nan')
        accuracy = 100 * correct / total if total else float('nan')

        print(f'Epoch {epoch+1}, Loss: {train_loss}, Validation Loss: {val_loss}, Accuracy: {accuracy}%')

    print('Finished Training')
    
# Build the classifier with its default head size and train it for ten epochs
# on the loaders created in the data-preparation cell.
model = ResNet18CatNotCat()
train_model(
    model,
    train_loader=train_loader,
    val_loader=val_loader,
    num_epochs=10,
)

  0%|          | 0/10 [00:00<?, ?it/s]