Import the necessary libraries

In [4]:
"""
This notebook downloads the train and test datasets used for training the CNN.
We use FiftyOne's zoo library to download them from Open Images V7.

The entire Open Images V7 database is 561 GB. It contains ~9 million images, of which
around 2 million are annotated (classification, detection, segmentation, etc.).
The zoo library supports partial downloads of the dataset, which helps a lot with
our purpose.

* All images have been rescaled so that their largest dimension is at most 1024 pixels.
"""
import fiftyone as fo
import os
import fiftyone.zoo as foz
from pprint import pprint
import matplotlib.pyplot as plt
import matplotlib.image as mpimg # Necessary for reading an image
import matplotlib.patches as patches # Necessary for drawing bounding boxes
import json
import dataHandler as handler

Download the datasets using the FiftyOne library.

We download two datasets: one for training and the other for testing.

In [2]:
# Download the images and labels used for training, or reuse them when a FiftyOne dataset
# named "open-images-v7-object-detection-DS-train" already exists.
dsName = "open-images-v7-object-detection-DS-train"
dsClasses = ["Person"]
dsSplit = "train"
dsLblTypes = ["detections", "classifications"]
nSamples = 1000

if fo.dataset_exists(dsName):
    datasetTrain = fo.load_dataset(dsName)
    print("Dataset already loaded.")
else:
    # Bind the downloaded dataset to `datasetTrain` as well: the export cell reads that
    # name, so binding it only in the "already exists" branch breaks a first run.
    datasetTrain = foz.load_zoo_dataset(
        "open-images-v7",
        split = dsSplit,
        label_types = dsLblTypes,
        classes = dsClasses,
        max_samples = nSamples,
        seed = 1,
        shuffle = True,
        dataset_name = dsName,
    )

Dataset already loaded.


In [3]:
# Download the images and labels used for testing, or reuse them when a FiftyOne dataset
# named "open-images-v7-object-detection-DS-test" already exists.
dsName = "open-images-v7-object-detection-DS-test"
dsClasses = ["Person"]
dsSplit = "test"
dsLblTypes = ["detections", "classifications"]
nSamples = 1000

if fo.dataset_exists(dsName):
    datasetTest = fo.load_dataset(dsName)
    print("Dataset already loaded. ")
else:
    # Bind the downloaded dataset to `datasetTest` as well: the export cell reads that
    # name, so binding it only in the "already exists" branch breaks a first run.
    datasetTest = foz.load_zoo_dataset(
        "open-images-v7",
        split = dsSplit,
        label_types = dsLblTypes,
        classes = dsClasses,
        max_samples = nSamples,
        seed = 2,
        shuffle = True,
        dataset_name = dsName,
    )

Dataset already loaded. 


In [None]:
# Optional sanity check: list the names of the FiftyOne datasets that currently exist,
# to confirm that the train and test datasets above were created.
fo.list_datasets()

Export the datasets to two directories, `images` and `labels`, each containing two sub-directories, namely `train` and `test`.

In [11]:
# Export the downloaded datasets to ./data/images/<split> (images) and
# ./data/labels/<split>/labels.json (labels).
def exportSplit(dataset, split):
    """Export one FiftyOne dataset in FiftyOneImageDetectionDataset format.

    Args:
        dataset: the FiftyOne dataset to export (e.g. `datasetTrain`).
        split: sub-directory name used under ./data/images and ./data/labels
            ("train" or "test").
    """
    imagesDir = f"./data/images/{split}"
    labelsDir = f"./data/labels/{split}"

    # exist_ok=True makes these calls no-ops for existing directories, so no separate
    # os.path.isdir check is needed.
    os.makedirs(imagesDir, exist_ok = True)
    os.makedirs(labelsDir, exist_ok = True)

    dataset.export(
        data_path = imagesDir,
        labels_path = f"{labelsDir}/labels.json",
        dataset_type = fo.types.FiftyOneImageDetectionDataset,
        classes = dsClasses,
        include_confidence = False
    )

# Train data
exportSplit(datasetTrain, "train")

# Test data
exportSplit(datasetTest, "test")

Directory './data/images/train' already exists; export will be merged with existing files
   2% |---------------|   22/1000 [237.0ms elapsed, 10.5s remaining, 92.8 samples/s] 



   5% ||--------------|   47/1000 [444.6ms elapsed, 9.0s remaining, 105.7 samples/s] 



   7% |█--------------|   72/1000 [659.3ms elapsed, 8.5s remaining, 109.2 samples/s] 



  10% |█|-------------|   96/1000 [871.5ms elapsed, 8.2s remaining, 110.2 samples/s] 



  13% |█\-------------|  132/1000 [1.2s elapsed, 7.9s remaining, 112.6 samples/s]    



  17% |██-------------|  170/1000 [1.5s elapsed, 7.4s remaining, 112.7 samples/s]    



  19% |██|------------|  193/1000 [1.7s elapsed, 7.3s remaining, 109.7 samples/s]    



  21% |███------------|  211/1000 [2.0s elapsed, 7.3s remaining, 114.2 samples/s]    



  24% |███/-----------|  241/1000 [2.3s elapsed, 7.3s remaining, 102.1 samples/s]    



                                                                                     



  30% |████-----------|  298/1000 [2.8s elapsed, 6.8s remaining, 97.8 samples/s]     



  32% |████|----------|  322/1000 [3.0s elapsed, 6.4s remaining, 104.2 samples/s]    



  35% |█████----------|  350/1000 [3.3s elapsed, 5.9s remaining, 112.8 samples/s]    



  38% |█████|---------|  379/1000 [3.5s elapsed, 5.4s remaining, 126.2 samples/s]    



  41% |██████---------|  409/1000 [3.7s elapsed, 5.1s remaining, 126.4 samples/s]    



  43% |██████|--------|  433/1000 [3.9s elapsed, 4.8s remaining, 128.3 samples/s]    



  46% |██████---------|  456/1000 [4.1s elapsed, 4.7s remaining, 123.3 samples/s]    



  48% |███████/-------|  484/1000 [4.5s elapsed, 4.8s remaining, 105.9 samples/s]    



  52% |███████|-------|  521/1000 [4.8s elapsed, 4.5s remaining, 102.0 samples/s]    



  56% |████████\------|  556/1000 [5.1s elapsed, 4.1s remaining, 105.0 samples/s]    



  60% |████████\------|  595/1000 [5.5s elapsed, 3.9s remaining, 103.1 samples/s]    



  63% |█████████------|  631/1000 [5.8s elapsed, 3.5s remaining, 101.8 samples/s]    



  67% |██████████-----|  672/1000 [6.3s elapsed, 3.3s remaining, 97.5 samples/s]     



  69% |██████████|----|  694/1000 [6.5s elapsed, 3.0s remaining, 100.3 samples/s]    



  71% |██████████\----|  713/1000 [6.8s elapsed, 3.2s remaining, 83.8 samples/s]     



  73% |██████████-----|  727/1000 [7.2s elapsed, 3.9s remaining, 62.3 samples/s]     



  78% |███████████----|  779/1000 [8.6s elapsed, 4.4s remaining, 44.0 samples/s]     



  80% |███████████|---|  795/1000 [8.8s elapsed, 3.4s remaining, 55.5 samples/s]     



  83% |████████████|--|  827/1000 [9.2s elapsed, 2.3s remaining, 71.3 samples/s]     



  86% |████████████|--|  859/1000 [9.6s elapsed, 1.9s remaining, 74.4 samples/s]     



  91% |█████████████/-|  910/1000 [10.1s elapsed, 1.0s remaining, 87.4 samples/s]    



  93% |█████████████\-|  928/1000 [10.4s elapsed, 808.8ms remaining, 89.0 samples/s] 



  95% |██████████████/|  947/1000 [10.6s elapsed, 562.6ms remaining, 94.5 samples/s] 



 100% |███████████████| 1000/1000 [11.1s elapsed, 0s remaining, 99.3 samples/s]       
Directory './data/images/test' already exists; export will be merged with existing files
   1% |---------------|    9/1000 [791.1ms elapsed, 1.5m remaining, 11.4 samples/s] 



   1% ||--------------|   14/1000 [1.0s elapsed, 1.2m remaining, 13.6 samples/s]    



   4% |\--------------|   37/1000 [1.4s elapsed, 35.4s remaining, 27.2 samples/s]   



   5% |/--------------|   54/1000 [1.6s elapsed, 27.5s remaining, 34.4 samples/s]   



   8% |█\-------------|   78/1000 [1.8s elapsed, 20.5s remaining, 69.6 samples/s]   



  10% |█/-------------|   95/1000 [2.0s elapsed, 18.2s remaining, 84.5 samples/s]   



  13% |█/-------------|  129/1000 [2.5s elapsed, 16.2s remaining, 81.4 samples/s]   



  15% |██\------------|  147/1000 [2.7s elapsed, 15.2s remaining, 76.8 samples/s]   



  17% |██/------------|  167/1000 [2.9s elapsed, 14.1s remaining, 74.7 samples/s]   



  19% |██\------------|  190/1000 [3.2s elapsed, 12.5s remaining, 93.5 samples/s]   



  21% |███------------|  214/1000 [3.5s elapsed, 11.9s remaining, 88.7 samples/s]   



  26% |███\-----------|  265/1000 [4.0s elapsed, 10.2s remaining, 93.9 samples/s]   



  28% |████/----------|  278/1000 [4.2s elapsed, 10.3s remaining, 82.7 samples/s]   



  31% |████|----------|  306/1000 [4.5s elapsed, 9.7s remaining, 84.2 samples/s]    



  33% |████-----------|  326/1000 [4.8s elapsed, 9.3s remaining, 84.1 samples/s]    



  36% |█████/---------|  356/1000 [5.1s elapsed, 8.6s remaining, 84.9 samples/s]    



  42% |██████\--------|  422/1000 [5.7s elapsed, 7.0s remaining, 100.6 samples/s]   



  45% |██████\--------|  454/1000 [6.2s elapsed, 6.9s remaining, 88.4 samples/s]    



  55% |████████-------|  551/1000 [7.3s elapsed, 5.9s remaining, 76.0 samples/s]    



  57% |████████/------|  574/1000 [7.7s elapsed, 5.9s remaining, 71.0 samples/s]    



  60% |█████████/-----|  601/1000 [8.1s elapsed, 5.5s remaining, 71.7 samples/s]    



  63% |█████████|-----|  629/1000 [8.4s elapsed, 5.1s remaining, 71.6 samples/s]    



  65% |█████████------|  649/1000 [8.6s elapsed, 4.6s remaining, 76.8 samples/s]    



  66% |█████████|-----|  665/1000 [8.8s elapsed, 4.2s remaining, 81.9 samples/s]    



  70% |██████████\----|  695/1000 [9.2s elapsed, 3.6s remaining, 88.4 samples/s]    



  75% |███████████----|  752/1000 [9.9s elapsed, 3.1s remaining, 82.7 samples/s]    



  77% |███████████|---|  770/1000 [10.2s elapsed, 3.1s remaining, 73.7 samples/s]   



  80% |████████████/--|  805/1000 [11.2s elapsed, 3.9s remaining, 46.1 samples/s]   



  83% |████████████\--|  827/1000 [11.4s elapsed, 3.2s remaining, 51.4 samples/s]   



  85% |████████████---|  853/1000 [11.7s elapsed, 1.8s remaining, 81.9 samples/s]   



                                                                                    



  92% |█████████████/-|  925/1000 [12.5s elapsed, 820.2ms remaining, 93.2 samples/s] 



  96% |██████████████/|  959/1000 [12.9s elapsed, 475.3ms remaining, 86.9 samples/s] 



  99% |██████████████||  988/1000 [13.2s elapsed, 145.3ms remaining, 82.7 samples/s] 



 100% |███████████████| 1000/1000 [13.4s elapsed, 0s remaining, 83.1 samples/s]      


In [12]:
# Deserialize the exported labels.json files and convert them to text files (one per image)
# to make them compatible with YOLO-v1.
def convertLabelsToYolo(labelsDir):
    """Write one `<image id>.txt` file into `labelsDir` for every entry of its labels.json.

    Each detection becomes one line of the form
    `<label> <centerX> <centerY> <width> <height>`, where the center is computed from the
    stored bounding box `[x, y, width, height]` as `x + width/2`, `y + height/2`.

    Args:
        labelsDir: directory that contains `labels.json`; the text files are written
            next to it.
    """
    # Use a context manager so the JSON file handle is closed after reading.
    with open(f"{labelsDir}/labels.json") as jsonFile:
        js = json.load(jsonFile)

    for item, detections in js["labels"].items():
        lines = []
        # NOTE(review): `or []` treats a null entry as "no detections" and writes an empty
        # label file; presumably FiftyOne can emit null for unlabeled images - confirm.
        for subItem in detections or []:
            left, top, width, height = subItem["bounding_box"][:4]
            centerX = left + width/2
            centerY = top + height/2
            label = subItem["label"]
            lines.append(f"{label} {centerX} {centerY} {width} {height}\n")
        # The with-statement closes the file; no explicit close() is required.
        with open(f"{labelsDir}/{item}.txt", 'w') as txtFile:
            txtFile.write("".join(lines))


# Training dataset
convertLabelsToYolo("./data/labels/train")

# Test dataset
convertLabelsToYolo("./data/labels/test")
    

View the downloaded datasets in the FiftyOne app. This might not work when the notebook runs on the server side.

In [None]:
# Browse the samples of the test dataset: load it by name and launch the FiftyOne app
# on a view of it.
aa = fo.load_dataset("open-images-v7-object-detection-DS-test")
session = fo.launch_app(aa.view())

Process the datasets

In [17]:
# Remove grayscale images (and their label files) from the test split.
# An image counts as grayscale here when it decodes to a 2-D array, i.e. it has no
# channel axis.

import os
from PIL import Image
import numpy as np

files = os.listdir("./data/images/test")

for file in files:
    imagePath = "./data/images/test/"+file
    # Close the image handle before the file is possibly deleted.
    with Image.open(imagePath) as pilImage:
        img = np.array(pilImage)
    if img.ndim == 2:
        print(f"Removed image {file} and its respective label.")
        os.remove(imagePath)
        # Derive the label name from the file stem so that extensions other than ".jpg"
        # do not make the label path point back at the image itself.
        labelPath = "./data/labels/test/"+os.path.splitext(file)[0]+".txt"
        # A missing label file must not abort the clean-up halfway through.
        if os.path.isfile(labelPath):
            os.remove(labelPath)

In [16]:
# Remove images with four channels (and their label files) from the test split.
# Alternatively, you can replace the image as well.

import os
from PIL import Image
import numpy as np

files = os.listdir("./data/images/test")

for file in files:
    imagePath = "./data/images/test/"+file
    # Close the image handle before the file is possibly deleted.
    with Image.open(imagePath) as pilImage:
        img = np.array(pilImage)
    # Check ndim first: a 2-D (grayscale) array has no shape[2], so indexing it directly
    # would raise an IndexError.
    if img.ndim == 3 and img.shape[2] == 4:
        print(f"Removed image {file} and its respective label.")
        os.remove(imagePath)
        # Derive the label name from the file stem so that extensions other than ".jpg"
        # do not make the label path point back at the image itself.
        labelPath = "./data/labels/test/"+os.path.splitext(file)[0]+".txt"
        # A missing label file must not abort the clean-up halfway through.
        if os.path.isfile(labelPath):
            os.remove(labelPath)