In [1]:
!pip install pytorch-lightning

Collecting pytorch-lightning
  Downloading pytorch_lightning-2.5.5-py3-none-any.whl.metadata (20 kB)
Collecting torchmetrics>0.7.0 (from pytorch-lightning)
  Downloading torchmetrics-1.8.2-py3-none-any.whl.metadata (22 kB)
Collecting lightning-utilities>=0.10.0 (from pytorch-lightning)
  Downloading lightning_utilities-0.15.2-py3-none-any.whl.metadata (5.7 kB)
Downloading pytorch_lightning-2.5.5-py3-none-any.whl (832 kB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m832.4/832.4 kB[0m [31m19.5 MB/s[0m eta [36m0:00:00[0m
[?25hDownloading lightning_utilities-0.15.2-py3-none-any.whl (29 kB)
Downloading torchmetrics-1.8.2-py3-none-any.whl (983 kB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m983.2/983.2 kB[0m [31m46.4 MB/s[0m eta [36m0:00:00[0m
[?25hInstalling collected packages: lightning-utilities, torchmetrics, pytorch-lightning
Successfully installed lightning-utilities-0.15.2 pytorch-lightning-2.5.5 torchmetrics-1.8.2


In [2]:
import sys
import os

def is_colab_env():
    """Return True when the ``google.colab`` module is already loaded.

    The check only inspects ``sys.modules``; it never tries to import the
    package itself.
    """
    loaded_modules = sys.modules
    return "google.colab" in loaded_modules

def mount_google_drive(drive_dir="/content/drive/", repo_dir="MyDrive/repositories/deepfake-detection"):
    """Mount Google Drive and switch the working directory to the repository.

    Args:
        drive_dir: Mount point passed to ``google.colab.drive.mount``. A
            trailing slash is optional.
        repo_dir: Location of the repository relative to ``drive_dir``.

    Raises:
        ImportError: If ``google.colab`` cannot be imported.
        OSError: If the resulting repository path cannot be entered.
    """
    # Deferred import so that merely defining this function does not require
    # the google.colab package.
    from google.colab import drive
    drive.mount(drive_dir)

    # Join with a proper separator instead of raw concatenation, so a
    # drive_dir without a trailing slash still resolves. Leading slashes are
    # stripped from repo_dir so it is always treated as relative to the mount.
    repo_path = os.path.join(drive_dir, os.fspath(repo_dir).lstrip("/"))
    os.chdir(repo_path)
    print(os.listdir())  # verify content

def resolve_path(levels_deep=3):
    """Make the project root importable from this notebook.

    When ``is_colab_env()`` is true, Google Drive is mounted and the working
    directory is changed via ``mount_google_drive()``. Otherwise the directory
    ``levels_deep`` levels above the current working directory is appended to
    ``sys.path``.

    Args:
        levels_deep: Number of parent directories to climb from the current
            working directory before adding the result to ``sys.path``.
    """
    if is_colab_env():
        mount_google_drive()
        return

    # A notebook has no __file__, so the working directory is the anchor.
    # (The previous abspath('__file__') on a string literal resolved to the
    # same directory.)
    project_root = os.getcwd()

    # Walk up to the requested ancestor directory
    for _ in range(levels_deep):
        project_root = os.path.dirname(project_root)

    # Re-running the cell must not pile up duplicate sys.path entries
    if project_root not in sys.path:
        sys.path.append(project_root)
    print(sys.path)

# Run the environment setup now so that the project-local imports in later cells can be resolved.
resolve_path()

Mounted at /content/drive/
['src', '.git', 'config.py', 'playground', 'reports', '__pycache__', 'setup', '.gitignore', 'train.py', 'README.md', 'environment2.yml', 'environment.yml', 'run_jupyter.sh']


In [3]:
# import local config
import config

In [4]:
# import library dependencies
import io
from itertools import islice
import matplotlib.pyplot as plt
import numpy as np

# image processing
import cv2
from PIL import Image

In [5]:
# pytorch
import torch
import pytorch_lightning as L

In [6]:
# import local dependencies
# from src.adapters.datasets.wilddeepfake import WildDeepfakeDataModule
from src.adapters.datasets.sida import SidADataModule
from src.models.freqnet import LitFreqNet

In [7]:
# Name of this experiment; it also names the sub-directory used for its artifacts.
model_id = "frequency_freqnet"
# Root directory later handed to the Trainer as `default_root_dir`.
model_checkpoint_dir = "{}/{}".format(config.CHECKPOINTS_DIR, model_id)

In [8]:
# Imported under the alias `T` so that the `transforms` dict defined at the end
# of this cell does not overwrite the module name. With the un-aliased import,
# re-running the cell raised AttributeError because `transforms` was by then a dict.
from torchvision import transforms as T

# --- common normalization (ImageNet) ---
imagenet_normalize = T.Normalize(
    mean=[0.485, 0.456, 0.406],
    std=[0.229, 0.224, 0.225],
)

# --- training transform ---
train_transform = T.Compose([
    T.Resize((256, 256)),                       # resize frame
    T.Lambda(lambda img: img.convert("RGB")),   # force RGB
    T.RandomHorizontalFlip(),                   # flip for augmentation
    T.ColorJitter(                              # optional: color variation
        brightness=0.2, contrast=0.2, saturation=0.2, hue=0.1
    ),
    T.ToTensor(),
    imagenet_normalize,
])

# --- validation transform ---
val_transform = T.Compose([
    T.Resize((256, 256)),                       # deterministic resize
    T.Lambda(lambda img: img.convert("RGB")),
    T.ToTensor(),
    imagenet_normalize,
])

# --- test transform (same pipeline as validation) ---
test_transform = T.Compose([
    T.Resize((256, 256)),
    T.Lambda(lambda img: img.convert("RGB")),
    T.ToTensor(),
    imagenet_normalize,
])

# Per-split lookup consumed by the data-loader factory in a later cell.
transforms = {
    "train": train_transform,
    "val": val_transform,
    "test": test_transform,
}

In [9]:
# Set seeds for reproducibility
seed = config.SEED

# seed_everything seeds Python's `random`, NumPy and torch in one call;
# workers=True also derives per-worker seeds for dataloader worker processes.
# The previous manual seeding covered torch and NumPy only.
L.seed_everything(seed, workers=True)

# Determine device (GPU or CPU)
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print(f"Using device: {device}")

Using device: cpu


In [10]:
# --- experiment configuration ---
dataset_name = "xingjunm/WildDeepfake"
max_samples = 900_000  # sample cap passed to the loader; for quick development, remove for full dataset
batch_size = 16
num_workers = 0
max_epochs = 20

# The WildDeepfakeDataModule wrapper is not used in this notebook; the loaders
# are built directly from the streaming helpers below.
from src.adapters.datasets.wilddeepfake import create_data_loaders, load_streaming_dataset

# Load the dataset splits in streaming mode
datasets = load_streaming_dataset(dataset_name, max_samples=max_samples, seed=seed)

# One loader per split, each using the matching entry of the `transforms` dict
train_loader, val_loader, test_loader = create_data_loaders(
    datasets,
    transforms=transforms,
    batch_size=batch_size,
    num_workers=num_workers,
)

Loading streaming dataset: xingjunm/WildDeepfake


README.md:   0%|          | 0.00/31.0 [00:00<?, ?B/s]

Resolving data files:   0%|          | 0/963 [00:00<?, ?it/s]

Resolving data files:   0%|          | 0/157 [00:00<?, ?it/s]

In [11]:
# Early stopping: end training once the validation loss stops improving
early_stop_callback = L.callbacks.EarlyStopping(
    monitor="val_loss",  # logged metric that is watched
    mode="min",          # a lower val_loss counts as an improvement
    patience=3,          # checks without improvement tolerated before stopping
    verbose=True,
)

In [12]:
# Lightning checkpoint callback: keep only the single checkpoint with the lowest val_loss
best_loss_checkpoint = L.callbacks.ModelCheckpoint(
    save_top_k=1,
    monitor="val_loss",
    mode="min",
)

In [13]:
# define model
# LitFreqNet is instantiated with its default constructor arguments.
deepfake_detector = LitFreqNet()

In [14]:
# Total optimisation-step budget: (desired_epochs × dataset_size) / batch_size.
# Floor division keeps this an int as `max_steps` is documented to be; true
# division always produced a float (and a fractional one whenever the product
# is not a multiple of batch_size).
total_train_steps = (max_epochs * max_samples) // batch_size

trainer = L.Trainer(
    devices=1,
    callbacks=[early_stop_callback, best_loss_checkpoint],
    default_root_dir=model_checkpoint_dir,  # checkpoints and logs are written below this directory
    log_every_n_steps=10,
    profiler="simple",  # track time taken
    max_steps=total_train_steps,
    # limit_train_batches=1000,   # how many batches per "epoch"
    # limit_val_batches=200,      # how many val batches per "epoch"
)

INFO:pytorch_lightning.utilities.rank_zero:GPU available: False, used: False
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs


In [None]:
# train model
# Alternative datamodule-based entry point, kept for reference (no `sida_data_module` is created in the cells above):
# trainer.fit(deepfake_detector, datamodule=sida_data_module)
# Fit using the explicit train/validation loaders built from the streaming dataset.
trainer.fit(deepfake_detector, train_dataloaders=train_loader, val_dataloaders=val_loader)

INFO:pytorch_lightning.callbacks.model_summary:
   | Name       | Type              | Params | Mode 
----------------------------------------------------------
0  | model      | FreqNet           | 1.9 M  | train
1  | loss_fn    | BCEWithLogitsLoss | 0      | train
2  | train_acc  | BinaryAccuracy    | 0      | train
3  | val_acc    | BinaryAccuracy    | 0      | train
4  | test_acc   | BinaryAccuracy    | 0      | train
5  | train_prec | BinaryPrecision   | 0      | train
6  | val_prec   | BinaryPrecision   | 0      | train
7  | test_prec  | BinaryPrecision   | 0      | train
8  | train_rec  | BinaryRecall      | 0      | train
9  | val_rec    | BinaryRecall      | 0      | train
10 | test_rec   | BinaryRecall      | 0      | train
11 | train_f1   | BinaryF1Score     | 0      | train
12 | val_f1     | BinaryF1Score     | 0      | train
13 | test_f1    | BinaryF1Score     | 0      | train
14 | train_auc  | BinaryAUROC       | 0      | train
15 | val_auc    | BinaryAUROC       | 0      

Sanity Checking: |          | 0/? [00:00<?, ?it/s]

/usr/local/lib/python3.12/dist-packages/pytorch_lightning/utilities/data.py:123: Your `IterableDataset` has `__len__` defined. In combination with multi-process data loading (when num_workers > 1), `__len__` could be inaccurate if each worker is not configured independently to avoid having duplicate data.


Training: |          | 0/? [00:00<?, ?it/s]

In [None]:
# test dataset on unseen samples
# trainer.test(deepfake_detector, datamodule=sida_data_module)
# ckpt_path="best" reloads the lowest-val_loss checkpoint tracked by the
# ModelCheckpoint callback. Without it, the weights left in memory after the
# last training step are evaluated, which early stopping leaves several
# validation checks past the best one. Requires trainer.fit to have run first.
trainer.test(deepfake_detector, dataloaders=test_loader, ckpt_path="best")

In [None]:
# view metrics from previous runs
# (Re)load the TensorBoard notebook extension, then point it at the directory
# that was given to the Trainer as `default_root_dir`.
%reload_ext tensorboard
%tensorboard --logdir=$model_checkpoint_dir