In [2]:
%matplotlib inline
from preprocessing_util import *
from util import create_train_test_sets
from facenet_pytorch import MTCNN
import torch

run_on_gpu = True  # set to False to force CPU execution even when CUDA is available

# Select the compute device: the first CUDA GPU when it is both requested and
# available, otherwise the CPU.
if run_on_gpu and torch.cuda.is_available():
    # The device string must not contain whitespace: the previous "cuda: 0"
    # is not a valid device string for strict device-string parsers
    # (newer PyTorch releases), so use the canonical "cuda:0" form.
    device = torch.device("cuda:0")
else:
    device = torch.device("cpu")

print(f'Running on device: {device}')

Running on device: cuda:0


## First we need to set up the data folders

Required:

1. Path to raw data
2. Path to store non-augmented data
3. Path to store augmented data

In [3]:
# Directory that holds the raw input data.
path_to_raw_data = 'jointdata/'

# Output directories: extracted faces without augmentation, and with augmentation.
path_to_store_faces, path_to_store_faces_aug = (
    'data/nontemp/faces/',
    'data/nontemp/faces_aug/',
)


### First load the face detection module

In [4]:
# Instantiate the MTCNN face detector on the selected device and put it in
# evaluation mode.
# NOTE(review): image_size / margin are presumably given in pixels and
# keep_all=False presumably keeps a single face per frame - confirm against
# the facenet-pytorch MTCNN documentation.
face_detector = MTCNN(
    device=device,
    image_size=224,
    margin=10,
    keep_all=False,
    post_process=False,
).eval()

### Config
Specify the number of frames extracted per real file. If this value is changed, the number of frames extracted per fake file must be adjusted separately as well.

E.g. for the Celeb-DF dataset:

There are 890 real files: 890 * 65 = 57,850
There are 5,639 fake files: 5,639 * 10 = 56,390

So the current configuration results in a balanced dataset. Note that only multiples of 5 can be selected when extracting temporal data, because the sequence length for the face sequences is set to 5 for the LSTM.

Also, a minimum face detection threshold can be set to disregard files which result in a large proportion of frames not detecting any faces.

Finally, specify whether the derived dataset is intended for training temporal or non-temporal models. Currently, each model type can only be trained using its respective dataset.

In [5]:
# --- Extraction settings for the real files ---
temporal = False       # False: derive the dataset for non-temporal models
log_plots = False      # if True, no face images are saved, only the plots are logged
n_frames = 45          # number of frames extracted per real file
# Minimum face detection threshold used to disregard files with too few detections.
# NOTE(review): presumably a count of detected faces per file - confirm in preprocessing_util.
min_face_cutoff = 20

# Facial detection pipeline wrapping the MTCNN detector for the chosen frame count.
face_detection = FaceDetection(face_detector, device, n_frames=n_frames)

# Extract the dataset
Extract one subfolder after another. We keep track of the labels for each datapoint via stored csv files.


In [5]:
# Real videos: run the face extraction over the 'real/' subfolder of the raw data.
label = 'Real'
name_csv = 'real'
path_to_folder = path_to_raw_data + 'real/'

labels = get_CDF_per_folder(
    # where to read from and where to write to
    path_to_data=path_to_folder,
    path_to_store_faces=path_to_store_faces,
    path_to_store_faces_aug=path_to_store_faces_aug,
    # labelling of the extracted datapoints
    label=label,
    csv_file_name=name_csv,
    # extraction pipeline and options
    face_detection=face_detection,
    min_face_cutoff=min_face_cutoff,
    temporal=temporal,
    log_plots=log_plots,
)

Extracting  faces from 2099 Real files


HBox(children=(FloatProgress(value=0.0, max=2099.0), HTML(value='')))

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 43]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 44]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 44]
[# extracted faces: 43]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 46]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted faces: 45]
[# extracted fac

We have now derived data from all real files. Next we need to derive data from the fake files.
As mentioned, this needs to be done with a different number of frames per file, to ensure a balanced dataset.
Make sure both `n_frames` settings produce a roughly equal number of datapoints for the two classes (see above).

In [7]:
# The fake files use a smaller frame count, so the detection pipeline is rebuilt
# with the reduced settings (the MTCNN detector itself is reused).
n_frames, min_face_cutoff = 10, 5
face_detection = FaceDetection(face_detector, device, n_frames=n_frames)

In [7]:
# Fake (synthesized) videos: run the face extraction over the 'fake/' subfolder
# of the raw data.
label = 'Fake'
name_csv = 'fake'
path_to_folder = path_to_raw_data + 'fake/'

labels = get_CDF_per_folder(
    # where to read from and where to write to
    path_to_data=path_to_folder,
    path_to_store_faces=path_to_store_faces,
    path_to_store_faces_aug=path_to_store_faces_aug,
    # labelling of the extracted datapoints
    label=label,
    csv_file_name=name_csv,
    # extraction pipeline and options
    face_detection=face_detection,
    min_face_cutoff=min_face_cutoff,
    temporal=temporal,
    log_plots=log_plots,
)

Extracting  faces from 9639 Fake files


HBox(children=(FloatProgress(value=0.0, max=9639.0), HTML(value='')))

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 9]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted face

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted fac

In [8]:
# Real-world synthesised (fake) videos: run face extraction over this folder.
# NOTE(review): the label CSVs are presumably written under the `name_csv`
# prefix, since the merge cells below read 'rwfake_labels_per_*.csv' -- confirm
# against get_CDF_per_folder.
label = 'Fake'
name_csv = 'rwfake'
path_to_folder = 'realworld/fake/'

labels = get_CDF_per_folder(
    path_to_data=path_to_folder,
    path_to_store_faces=path_to_store_faces,
    path_to_store_faces_aug=path_to_store_faces_aug,
    face_detection=face_detection,
    label=label,
    csv_file_name=name_csv,
    min_face_cutoff=min_face_cutoff,
    temporal=temporal,
    log_plots=log_plots,
)

Extracting  faces from 140 Fake files


HBox(children=(FloatProgress(value=0.0, max=140.0), HTML(value='')))

[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 9]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted faces: 10]
[# extracted face

## Label merging
Each folder processed above has its own label file; these need to be merged.
For each dataset, we handle two different types of labels:

1. Per-file labels
2. Per-datapoint labels (per face image for non-temporal models, per face window for temporal models)


First, we merge the labels at file level.

In [9]:
# Merge the per-file label CSVs of the three source folders (real, fake,
# real-world fake) into one table and persist it for the split step.
path = "Labels/"
file1, file2, file3 = (
    "real_labels_per_file.csv",
    "fake_labels_per_file.csv",
    "rwfake_labels_per_file.csv",
)

labels_per_file = combine_labels(path, file1, file2, file3)
labels_per_file.to_csv("Labels/labels_per_file.csv")

# Bare last expression so the notebook renders the merged table.
labels_per_file

Unnamed: 0,file,label
0,000.mp4,0
1,00000.mp4,0
2,00001.mp4,0
3,00002.mp4,0
4,00003.mp4,0
...,...,...
11872,fake_95.mp4,1
11873,fake_96.mp4,1
11874,fake_97.mp4,1
11875,fake_98.mp4,1


Next, we merge the labels at datapoint level.

In [10]:
# Datapoint-level labels are stored per face (non-temporal) or per face window
# (temporal); the file-name suffix follows the `temporal` flag.
datapoint_kind = 'face_window' if temporal else 'face'

path = "Labels/"
file1 = f"real_labels_per_{datapoint_kind}.csv"
file2 = f"fake_labels_per_{datapoint_kind}.csv"
file3 = f"rwfake_labels_per_{datapoint_kind}.csv"

labels_per_face = combine_labels(path, file1, file2, file3)
labels_per_face.to_csv(f"Labels/labels_per_{datapoint_kind}.csv")

# Bare last expression so the notebook renders the merged table.
labels_per_face

Unnamed: 0,file,label
0,000_000.mp4,0
1,001_000.mp4,0
2,002_000.mp4,0
3,003_000.mp4,0
4,004_000.mp4,0
...,...,...
192188,005_fake_99.mp4,1
192189,006_fake_99.mp4,1
192190,007_fake_99.mp4,1
192191,008_fake_99.mp4,1


## Create splits

Now that we have the datasets and labels, we can perform the train/val/test split. We do this on file level.
The size of the training set can be adjusted. The remaining proportion of the dataset is split evenly between the validation and test sets.

In [11]:
# Proportion of the dataset used for training; per the text above, the rest is
# divided evenly between the validation and test sets.
train_size = 0.8

Do the split. The resulting label files per split will be stored in the root folders where the data is located.

In [None]:
# Paths to the merged label CSVs written by the two label-merging cells above.
# Note: from here on these names hold path strings, not the DataFrames that
# were displayed earlier.
labels_per_file = 'Labels/labels_per_file.csv'
# Follow the same naming rule as the datapoint-level merge cell, so that a
# temporal run reads 'labels_per_face_window.csv' instead of a missing or stale
# 'labels_per_face.csv'. For temporal=False the path is unchanged.
labels_per_face = f"Labels/labels_per_{'face' if not temporal else 'face_window'}.csv"

# Perform the file-level train/val/test split. Per the notebook text, the
# per-split label files are stored in the data root folders passed below.
create_train_test_sets(labels_per_file=labels_per_file,
                       labels_per_face=labels_per_face,
                       root_dir=path_to_store_faces,
                       root_dir_aug=path_to_store_faces_aug,
                       train_size=train_size,
                       temporal=temporal)

Deriving the correct face labels for the split...


HBox(children=(FloatProgress(value=0.0, max=9501.0), HTML(value='')))