In [1]:
pip install torch torchvision opencv-python numpy


Note: you may need to restart the kernel to use updated packages.



[notice] A new release of pip is available: 24.3.1 -> 25.0.1
[notice] To update, run: python.exe -m pip install --upgrade pip


In [44]:
import torch
import torch.nn as nn
import torchvision.models as models
import torchvision.transforms as transforms
from PIL import Image

# Create the model architecture
model = models.resnet50(pretrained=False)

# Get the input features dimension
in_features = model.fc.in_features

# Define the sequential structure with the correct dimensions
model.fc = nn.Sequential(
    nn.Linear(in_features, 512),  # fc.0 - First layer has 512 output features
    nn.ReLU(),                    # fc.1 (no parameters)
    nn.Dropout(0.5),              # fc.2 (no parameters)
    nn.Linear(512, 256),          # fc.3 - Second layer has 256 output features
    nn.ReLU(),                    # fc.4 (no parameters)
    nn.Dropout(0.5),              # fc.5 (no parameters)
    nn.Linear(256, 2)             # fc.6 - Final layer for binary classification
)

# Load the trained weights
model.load_state_dict(torch.load('best_deepfake_detector.pth', map_location=torch.device('cpu')))
model.eval()

ResNet(
  (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
  (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (relu): ReLU(inplace=True)
  (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
  (layer1): Sequential(
    (0): Bottleneck(
      (conv1): Conv2d(64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn3): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
      (downsample): Sequential(
        (0): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 

In [4]:
import torchvision.transforms as transforms
from PIL import Image

transform = transforms.Compose([
    transforms.Resize((224, 224)),
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

In [45]:
from PIL import Image
import torch
import cv2
import torchvision.transforms as transforms

def predict_image(frame):
    # Convert from BGR (OpenCV) to RGB (PIL)
    image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
    image = transform(image).unsqueeze(0)
    
    with torch.no_grad():
        outputs = model(image)
        _, predicted = torch.max(outputs, 1)
        
    return predicted.item()


In [47]:
import cv2

video_path = '10sec_video.mp4'
cap = cv2.VideoCapture(video_path)
fps = cap.get(cv2.CAP_PROP_FPS)

frame_count = 0
real_count = 0
fake_count = 0

while True:
    ret, frame = cap.read()
    if not ret:
        break

    if frame_count % 3 == 0:
        if predict_image(frame) == 1:
            fake_count += 1
        else:
            real_count += 1

    frame_count += 1

real_prob = round(real_count / round(frame_count / 3)) * 100
fake_prob = round(fake_count / round(frame_count / 3)) * 100
print('Video is ' + str(real_prob) + '% real and ' + str(fake_prob) + '% fake')
cap.release()


Video is 100% real and 0% fake


In [None]:
import cv2

video_path = '30sec_video.mp4'
cap = cv2.VideoCapture(video_path)

frame_count = 0
real_count = 0
fake_count = 0

while True:
    ret, frame = cap.read()
    if not ret:
        break

    if frame_count % 3 == 0:
        if predict_image(frame) == 1:
            fake_count += 1
        else:
            real_count += 1

    frame_count += 1

real_prob = real_count / (frame_count / 3)
fake_prob = fake_count / (frame_count / 3)
print('Video is ' + str(real_prob) + '% real and ' + str(fake_prob) + '% fake')
# print('real_count: ', real_count)
# print('fake_count', fake_count)
# print(fps)
cap.release()


Video is 1.000984251968504% real and 0.0% fake


In [None]:
import cv2

video_path = '10sec_video1.mp4'
cap = cv2.VideoCapture(video_path)

frame_count = 0
real_count = 0
fake_count = 0

while True:
    ret, frame = cap.read()
    if not ret:
        break

    if frame_count % 3 == 0:
        if predict_image(frame) == 1:
            fake_count += 1
        else:
            real_count += 1

    frame_count += 1

real_prob = real_count / (frame_count / 3)
fake_prob = fake_count / (frame_count / 3)
print('Video is ' + str(real_prob) + '% real and ' + str(fake_prob) + '% fake')
# print('real_count: ', real_count)
# print('fake_count', fake_count)
# print(fps)
cap.release()


Video is 0.8493150684931506% real and 0.1506849315068493% fake


In [None]:
import cv2

video_path = '30sec_video.mp4'
cap = cv2.VideoCapture(video_path)

frame_count = 0
real_count = 0
fake_count = 0

while True:
    ret, frame = cap.read()
    if not ret:
        break

    if frame_count % 3 == 0:
        if predict_image(frame) == 1:
            fake_count += 1
        else:
            real_count += 1

    frame_count += 1

real_prob = real_count / (frame_count / 3)
fake_prob = fake_count / (frame_count / 3)
print('Video is ' + str(real_prob) + '% real and ' + str(fake_prob) + '% fake')
# print('real_count: ', real_count)
# print('fake_count', fake_count)
# print(fps)
cap.release()


Video is 1.0% real and 0.0% fake
