datasetCreationUtils.py

import cv2
import os
import random
import numpy as np
import pandas as pd

# Global counting of the data
folder_count = 0
frame_lab = ['a', 'b', 'c']
PATH = ''
# For each video in the list, extract some frames
def extractFromVideos(lst, dir_out):
  PATH = dir_out
  os.mkdir(PATH)
  for elem in lst:
    extractFrames("/content/Hollywood2/AVIClips/"+elem, PATH)
    print(elem)
 
# At each video passed, extract 3 frames every 10, and grouping them in a subfolder
def extractFrames(pathIn, pathOut):
    FPS = 25
 
    cap = cv2.VideoCapture(pathIn)
    count = 0
 
    global folder_count
 
    rel_path = pathOut
    os.makedirs(pathOut, exist_ok=True)
    while (cap.isOpened()):
        # Capture frame-by-frame
        ret, frame = cap.read()
 
        if ret == True:
            if(count%FPS == 0 or count%FPS == 1 or count%FPS == 2):
              if(count%FPS == 0 ):
                # final_path = rel_path+"{:d}/".format(folder_count)
 
                folder_count = int(folder_count) + 1
              cv2.imwrite(os.path.join(pathOut, "frame"+str(folder_count)+frame_lab[count%FPS]+".jpg"), frame)  # save frame as JPEG file
            count += 1
        else:
            break
 
    # When everything done, release the capture
    cap.release()
    cv2.destroyAllWindows()

#function to crop a square image of 150 x 150 around a given pixel
def crop_image(path, cx, cy):
    
  
  #try to read the image (to make sure it exists)
  try:
    img = cv2.imread(path)
  except:
    print('Cannot read: ',path)
    return []

  return img[int(cy-75):int(cy+75), int(cx-75):int(cx+75),:]

# Function which takes every triplet of images in the dataset and extract 25 
# random patches of 150 x 150. It stores them in a folder that will be then compressed
# and saves the files path in a pandas dataframe, which will be used later to load 
# the data in tensorflow
def build_dataset(img_c):
  random.seed(10)
  data = pd.DataFrame(columns=['frameA', 'frameB','frameC', 'x', 'y'])

  idx = 0

  for i in range(1, img_c + 1):
    sh = cv2.imread('/content/images/frame'+str(i)+'a.jpg').shape[0:2]
    #print(sh)
    x = np.random.randint(75, sh[1] - 75, 25)
    y = np.random.randint(75, sh[0] - 75, 25)
    #print(sh[1])
    for j in range(len(x)):

      imgA = crop_image('./images/frame'+str(i)+'a.jpg', x[j], y[j])
      imgB = crop_image('./images/frame'+str(i)+'b.jpg', x[j], y[j])
      imgC = crop_image('./images/frame'+str(i)+'c.jpg', x[j], y[j])

      if(imgB.shape != (0,) and imgC.shape != (0,)):
        
        path = './crops/'+str(idx)+'/'
        os.makedirs(path, exist_ok=True)
        cv2.imwrite(path +'a.jpg', np.float32(imgA))
        cv2.imwrite(path +'b.jpg', np.float32(imgB))
        cv2.imwrite(path +'c.jpg',  np.float32(imgC))
        data.loc[idx] = ['./crops/'+str(idx)+'/a.jpg','./crops/'+str(idx)+'/b.jpg', './crops/'+str(idx)+'/c.jpg', x[j], y[j]]
        #df = df.append({'A': i}, ignore_index=True)
        idx += 1

    if(i%1000 == 0):
      print(i)

  return data