In [2]:
import os
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader
from tqdm import tqdm
from sklearn.metrics import roc_curve
import pandas as pd
# from apex import amp  # for mixed precision training
from torchvision import models

In [3]:
# Define transforms for data augmentation and normalization
data_transforms = {
    'train': transforms.Compose([
        transforms.RandomResizedCrop(224),
        transforms.RandomHorizontalFlip(),
        transforms.ToTensor(),
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
    ]),
    'val': transforms.Compose([
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
    ]),
    'test': transforms.Compose([
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
    ]),
}

In [4]:
# Set the paths to your training and validation directories
train_dir = '/kaggle/input/morph-splitted/train'
val_dir = '/kaggle/input/morph-splitted/val'
test_dir = '/kaggle/input/morph-splitted/test'

In [5]:
image_datasets = {
    'train': datasets.ImageFolder(train_dir, data_transforms['train']),
    'val': datasets.ImageFolder(val_dir, data_transforms['val']),
    'test': datasets.ImageFolder(test_dir, data_transforms['test'])
}


In [6]:
# Create data loaders
dataloaders = {
    'train': DataLoader(image_datasets['train'], batch_size=32, shuffle=True, num_workers=4),
    'val': DataLoader(image_datasets['val'], batch_size=32, shuffle=False, num_workers=4),
    'test': DataLoader(image_datasets['test'], batch_size=32, shuffle=False, num_workers=4)
}


In [7]:
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

In [8]:
# Define DenseNet model for binary classification
class DenseNetBinary(nn.Module):
    def __init__(self):
        super(DenseNetBinary, self).__init__()
        self.model = models.densenet121(pretrained=True)
        num_ftrs = self.model.classifier.in_features
        self.model.classifier = nn.Linear(num_ftrs, 1)  # Output layer with 1 neuron for binary classification
    
    def forward(self, x):
        return self.model(x)

# Initialize the model
model = DenseNetBinary().to(device)
criterion = nn.BCEWithLogitsLoss()  # Binary cross-entropy loss
optimizer = optim.Adam(model.parameters(), lr=0.001)  # Only train the classifier


Downloading: "https://download.pytorch.org/models/densenet121-a639ec97.pth" to /root/.cache/torch/hub/checkpoints/densenet121-a639ec97.pth
100%|██████████| 30.8M/30.8M [00:00<00:00, 129MB/s] 


In [9]:
num_epochs = 10
best_model_wts = model.state_dict()
best_acc = 0.0
dataset_sizes = {x: len(image_datasets[x]) for x in ['train', 'val']}


In [10]:
# Training loop
for epoch in range(num_epochs):
    print(f'Epoch {epoch+1}/{num_epochs}')
    print('-' * 10)

    # Each epoch has a training and validation phase
    for phase in ['train', 'val']:
        if phase == 'train':
            model.train()  # Set model to training mode
        else:
            model.eval()  # Set model to evaluate mode

        running_loss = 0.0
        running_corrects = 0

        # Iterate over data with progress bar
        with tqdm(total=len(dataloaders[phase]), desc=f'{phase} Phase', unit='batch') as pbar:
            for i, (inputs, labels) in enumerate(dataloaders[phase]):
                inputs = inputs.to(device)
                labels = labels.to(device)

                # Zero the parameter gradients
                optimizer.zero_grad()

                # Forward pass
                with torch.set_grad_enabled(phase == 'train'):
                    outputs = model(inputs)
                    preds = torch.sigmoid(outputs).round()
                    loss = criterion(outputs, labels.unsqueeze(1).float())

                    # Backward pass and optimize only if in training phase
                    if phase == 'train':
                        loss.backward()
                        optimizer.step()

                # Statistics
                running_loss += loss.item() * inputs.size(0)
                running_corrects += torch.sum(preds == labels.unsqueeze(1))

                # Update progress bar
                pbar.update(1)
                pbar.set_postfix(loss=running_loss / ((pbar.n + 1) * inputs.size(0)),
                                 accuracy=running_corrects.double() / ((pbar.n + 1) * inputs.size(0)))

        epoch_loss = running_loss / dataset_sizes[phase]
        epoch_acc = running_corrects.double() / dataset_sizes[phase]

        print(f'{phase} Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')

        # Deep copy the model
        if phase == 'val' and epoch_acc > best_acc:
            best_acc = epoch_acc
            best_model_wts = model.state_dict()

    print()

# Load best model weights
model.load_state_dict(best_model_wts)
print('Best val Acc: {:4f}'.format(best_acc))


Epoch 1/10
----------


train Phase: 100%|██████████| 750/750 [02:24<00:00,  5.21batch/s, accuracy=tensor(0.9744, device='cuda:0', dtype=torch.float64), loss=0.0633]


train Loss: 0.0634 Acc: 0.9757


val Phase: 100%|██████████| 250/250 [00:23<00:00, 10.52batch/s, accuracy=tensor(0.9701, device='cuda:0', dtype=torch.float64), loss=0.0767] 


val Loss: 0.0770 Acc: 0.9740

Epoch 2/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.22batch/s, accuracy=tensor(0.9857, device='cuda:0', dtype=torch.float64), loss=0.0369]


train Loss: 0.0370 Acc: 0.9870


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.58batch/s, accuracy=tensor(0.9801, device='cuda:0', dtype=torch.float64), loss=0.044]  


val Loss: 0.0442 Acc: 0.9840

Epoch 3/10
----------


train Phase: 100%|██████████| 750/750 [02:24<00:00,  5.21batch/s, accuracy=tensor(0.9882, device='cuda:0', dtype=torch.float64), loss=0.0279]


train Loss: 0.0279 Acc: 0.9895


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.55batch/s, accuracy=tensor(0.9795, device='cuda:0', dtype=torch.float64), loss=0.0455] 


val Loss: 0.0457 Acc: 0.9834

Epoch 4/10
----------


train Phase: 100%|██████████| 750/750 [02:24<00:00,  5.21batch/s, accuracy=tensor(0.9900, device='cuda:0', dtype=torch.float64), loss=0.0248]


train Loss: 0.0249 Acc: 0.9913


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.55batch/s, accuracy=tensor(0.9950, device='cuda:0', dtype=torch.float64), loss=0.00268] 


val Loss: 0.0027 Acc: 0.9990

Epoch 5/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.21batch/s, accuracy=tensor(0.9897, device='cuda:0', dtype=torch.float64), loss=0.0256]


train Loss: 0.0256 Acc: 0.9910


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.49batch/s, accuracy=tensor(0.9953, device='cuda:0', dtype=torch.float64), loss=0.00147] 


val Loss: 0.0015 Acc: 0.9992

Epoch 6/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.22batch/s, accuracy=tensor(0.9910, device='cuda:0', dtype=torch.float64), loss=0.0217]


train Loss: 0.0217 Acc: 0.9923


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.55batch/s, accuracy=tensor(0.9268, device='cuda:0', dtype=torch.float64), loss=0.227]  


val Loss: 0.2276 Acc: 0.9305

Epoch 7/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.24batch/s, accuracy=tensor(0.9913, device='cuda:0', dtype=torch.float64), loss=0.0207]


train Loss: 0.0208 Acc: 0.9926


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.54batch/s, accuracy=tensor(0.9935, device='cuda:0', dtype=torch.float64), loss=0.00724] 


val Loss: 0.0073 Acc: 0.9975

Epoch 8/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.23batch/s, accuracy=tensor(0.9928, device='cuda:0', dtype=torch.float64), loss=0.0167]


train Loss: 0.0168 Acc: 0.9941


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.65batch/s, accuracy=tensor(0.9894, device='cuda:0', dtype=torch.float64), loss=0.0173]  


val Loss: 0.0174 Acc: 0.9934

Epoch 9/10
----------


train Phase: 100%|██████████| 750/750 [02:22<00:00,  5.25batch/s, accuracy=tensor(0.9933, device='cuda:0', dtype=torch.float64), loss=0.0137] 


train Loss: 0.0137 Acc: 0.9947


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.81batch/s, accuracy=tensor(0.9934, device='cuda:0', dtype=torch.float64), loss=0.00665] 


val Loss: 0.0067 Acc: 0.9974

Epoch 10/10
----------


train Phase: 100%|██████████| 750/750 [02:23<00:00,  5.22batch/s, accuracy=tensor(0.9934, device='cuda:0', dtype=torch.float64), loss=0.0149] 


train Loss: 0.0150 Acc: 0.9947


val Phase: 100%|██████████| 250/250 [00:18<00:00, 13.79batch/s, accuracy=tensor(0.9854, device='cuda:0', dtype=torch.float64), loss=0.0303]  

val Loss: 0.0304 Acc: 0.9894

Best val Acc: 0.999250





In [12]:
# Test the model
model.eval()
running_loss = 0.0
running_corrects = 0

with torch.no_grad():
    for inputs, labels in dataloaders['test']:
        inputs = inputs.to(device)
        labels = labels.float().view(-1, 1).to(device)

        outputs = model(inputs)
        preds = torch.sigmoid(outputs) > 0.5
        loss = criterion(outputs, labels)

        running_loss += loss.item() * inputs.size(0)
        running_corrects += torch.sum(preds == labels.data)

test_loss = running_loss / len(image_datasets['test'])
test_acc = running_corrects.double() / len(image_datasets['test'])

print(f'Test Loss: {test_loss:.4f} Acc: {test_acc:.4f}')


Test Loss: 0.0331 Acc: 0.9895


In [13]:
import torch
from torch.utils.data import DataLoader

# Function to create data loaders
def create_data_loader(data_dir, transform, batch_size):
    dataset = datasets.ImageFolder(data_dir, transform)
    data_loader = DataLoader(dataset, batch_size=batch_size, shuffle=False, num_workers=4)
    return data_loader

# Define the transforms for the datasets
transform = transforms.Compose([
    transforms.Resize(256),
    transforms.CenterCrop(224),
    transforms.ToTensor(),
    transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
])

batch_size = 16

# Create data loaders for each dataset
fm_loader = create_data_loader('/kaggle/input/mad-benchmark/FaceMorpher', transform, batch_size)
mg1_loader = create_data_loader('/kaggle/input/mad-benchmark/MIPGAN_I', transform, batch_size)
mg2_loader = create_data_loader('/kaggle/input/mad-benchmark/MIPGAN_II', transform, batch_size)
oc_loader = create_data_loader('/kaggle/input/mad-benchmark/OpenCV', transform, batch_size)
wm_loader = create_data_loader('/kaggle/input/mad-benchmark/Webmorph', transform, batch_size)


In [14]:
data_loaders = [fm_loader, mg1_loader, mg2_loader, oc_loader, wm_loader]
results = []
losses = []

# Evaluate the model on each dataset
criterion = nn.BCEWithLogitsLoss()
model.eval()

DenseNetBinary(
  (model): DenseNet(
    (features): Sequential(
      (conv0): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
      (norm0): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu0): ReLU(inplace=True)
      (pool0): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
      (denseblock1): _DenseBlock(
        (denselayer1): _DenseLayer(
          (norm1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (relu1): ReLU(inplace=True)
          (conv1): Conv2d(64, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (norm2): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (relu2): ReLU(inplace=True)
          (conv2): Conv2d(128, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
        )
        (denselayer2): _DenseLayer(
          (norm1): BatchNorm2d(96, eps=1e-05, momentu

In [15]:
for loader_idx, data_loader in enumerate(data_loaders):
    running_loss = 0.0
    running_corrects = 0
    total_samples = 0

    dataset_name = ["FaceMorpher", "MIPGAN_I", "MIPGAN_II", "OpenCV", "Webmorph"][loader_idx]
    print(f"Evaluating dataset: {dataset_name}")

    for inputs, labels in tqdm(data_loader, desc=f"Processing {dataset_name}", leave=False):
        inputs = inputs.to(device)
        labels = labels.float().view(-1, 1).to(device)

        outputs = model(inputs)
        preds = torch.sigmoid(outputs) > 0.5
        loss = criterion(outputs, labels)

        running_loss += loss.item() * inputs.size(0)
        running_corrects += torch.sum(preds == labels.data)
        total_samples += inputs.size(0)

    test_loss = running_loss / total_samples
    test_accuracy = running_corrects.double() / total_samples

    results.append(test_accuracy.item())
    losses.append(test_loss)

    print(f"{dataset_name} - Loss: {test_loss:.4f} Acc: {test_accuracy:.4f}")

# Print the final results
print("\nFinal Results:")
names = ["FaceMorpher", "MIPGAN_I", "MIPGAN_II", "OpenCV", "Webmorph"]
for name, accuracy in zip(names, results):
    print(f"{name}: {accuracy:.4f}")


Evaluating dataset: FaceMorpher


                                                                       

FaceMorpher - Loss: 1.6577 Acc: 0.6578
Evaluating dataset: MIPGAN_I


                                                                    

MIPGAN_I - Loss: 2.5322 Acc: 0.4684
Evaluating dataset: MIPGAN_II


                                                                     

MIPGAN_II - Loss: 2.2831 Acc: 0.4888
Evaluating dataset: OpenCV


                                                                  

OpenCV - Loss: 8.4672 Acc: 0.1742
Evaluating dataset: Webmorph


                                                                    

Webmorph - Loss: 9.5318 Acc: 0.2898

Final Results:
FaceMorpher: 0.6578
MIPGAN_I: 0.4684
MIPGAN_II: 0.4888
OpenCV: 0.1742
Webmorph: 0.2898




### **Evaluation Metrics**

In [16]:
import torch
import numpy as np
import pandas as pd
from sklearn.metrics import roc_curve

def calculate_apcer(true_labels, predictions, fixed_bpcer):
    """Calculate APCER at a fixed BPCER."""
    fpr, tpr, thresholds = roc_curve(true_labels, predictions, pos_label=1)
    fpr_target = fixed_bpcer
    closest_fpr_index = np.argmin(np.abs(fpr - fpr_target))
    apcer = 1 - tpr[closest_fpr_index]
    return apcer

def calculate_bpcer(true_labels, predictions, fixed_apcer):
    """Calculate BPCER at a fixed APCER."""
    fpr, tpr, thresholds = roc_curve(true_labels, predictions, pos_label=1)
    tpr_target = 1 - fixed_apcer
    closest_tpr_index = np.argmin(np.abs(tpr - tpr_target))
    bpcer = fpr[closest_tpr_index]
    return bpcer

def calculate_eer(true_labels, predictions):
    """Calculate EER."""
    fpr, tpr, thresholds = roc_curve(true_labels, predictions, pos_label=1)
    frr = 1 - tpr
    eer_index = np.argmin(np.abs(fpr - frr))
    eer = fpr[eer_index]
    return eer

# Define datasets and model predictions
datasets = [fm_loader, mg1_loader, mg2_loader, oc_loader, wm_loader]
names = ["FaceMorpher", "MIPGAN_I", "MIPGAN_II", "OpenCV", "Webmorph"]
fixed_bpcer_values = [0.01, 0.1, 0.2]
fixed_apcer_values = [0.01, 0.1, 0.2]
all_results = []

# Move the model to the GPU if available
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model.to(device)
model.eval()  # Ensure the model is in evaluation mode

# Iterate over each dataset
for dataset, name in zip(datasets, names):
    print(f"Evaluating model on dataset: {name}")
    
    # Predictions and true labels
    all_predictions = []
    all_true_labels = []
    for inputs, labels in dataset:
        inputs, labels = inputs.to(device), labels.to(device)  # Move data to the GPU
        with torch.no_grad():  # Disable gradient computation
            predictions = model(inputs)
        all_predictions.append(predictions.detach().cpu().numpy())
        all_true_labels.append(labels.cpu().numpy())
    predictions = np.concatenate(all_predictions)
    true_labels = np.concatenate(all_true_labels)

    # Calculate metrics for each fixed BPCER
    for fixed_bpcer in fixed_bpcer_values:
        print(f"Calculating metrics for fixed BPCER: {fixed_bpcer}")
        apcer = calculate_apcer(true_labels, predictions, fixed_bpcer)
        result = {
            "Dataset": name,
            "Fixed BPCER": f"{fixed_bpcer * 100:.1f}%",
            "APCER": apcer
        }
        all_results.append(result)
    
    # Calculate metrics for each fixed APCER
    for fixed_apcer in fixed_apcer_values:
        print(f"Calculating metrics for fixed APCER: {fixed_apcer}")
        bpcer = calculate_bpcer(true_labels, predictions, fixed_apcer)
        result = {
            "Dataset": name,
            "Fixed APCER": f"{fixed_apcer * 100:.1f}%",
            "BPCER": bpcer
        }
        all_results.append(result)

    # Calculate EER
    eer = calculate_eer(true_labels, predictions)
    result = {
        "Dataset": name,
        "EER": eer
    }
    all_results.append(result)

# Convert the results to a Pandas DataFrame
df_results = pd.DataFrame(all_results)

# Display the DataFrame
print(df_results)


Evaluating model on dataset: FaceMorpher
Calculating metrics for fixed BPCER: 0.01
Calculating metrics for fixed BPCER: 0.1
Calculating metrics for fixed BPCER: 0.2
Calculating metrics for fixed APCER: 0.01
Calculating metrics for fixed APCER: 0.1
Calculating metrics for fixed APCER: 0.2
Evaluating model on dataset: MIPGAN_I
Calculating metrics for fixed BPCER: 0.01
Calculating metrics for fixed BPCER: 0.1
Calculating metrics for fixed BPCER: 0.2
Calculating metrics for fixed APCER: 0.01
Calculating metrics for fixed APCER: 0.1
Calculating metrics for fixed APCER: 0.2
Evaluating model on dataset: MIPGAN_II
Calculating metrics for fixed BPCER: 0.01
Calculating metrics for fixed BPCER: 0.1
Calculating metrics for fixed BPCER: 0.2
Calculating metrics for fixed APCER: 0.01
Calculating metrics for fixed APCER: 0.1
Calculating metrics for fixed APCER: 0.2
Evaluating model on dataset: OpenCV
Calculating metrics for fixed BPCER: 0.01
Calculating metrics for fixed BPCER: 0.1
Calculating metrics