In [1]:
# import the necessary packages
from imutils import paths
import face_recognition
import pickle
import cv2
import os

In [8]:
def encode_face_data():
    # grab the paths to the input images in our dataset
    print("[INFO] quantifying faces...")
    
    # Face recognition dataset
    dataset = 'face_recognition_dataset/'
    
    # Output encoding file
    encodings_file = 'encodings.pickle'
    
    # Face detection method (cnn or hog)
    detection_method = 'cnn'
    imagePaths = list(paths.list_images(dataset))
    
    # initialize the list of known encodings and known names
    knownEncodings = []
    knownNames = []
    
    # loop over the image paths
    for (i, imagePath) in enumerate(imagePaths):
        
        # extract the person name from the image path
        print("[INFO] processing image {}/{}".format(i + 1,
            len(imagePaths)))
        name = imagePath.split(os.path.sep)[-2]
        
        # load the input image and convert it from BGR (OpenCV ordering)
        # to dlib ordering (RGB)
        image = cv2.imread(imagePath)
        rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        
        # detect the (x, y)-coordinates of the bounding boxes
        # corresponding to each face in the input image
        # face_recognition.face_locations
        """img – An image (as a numpy array)
        number_of_times_to_upsample – How many times to upsample the 
        image looking for faces. Higher numbers find smaller faces.
        model – Which face detection model to use. “hog” is less 
        accurate but faster on CPUs. “cnn” is a more accurate 
        deep-learning model which is GPU/CUDA accelerated (if 
        available). The default is “hog”.
        Returns: A list of tuples of found face locations in css (top,
        right, bottom, left) order"""
        boxes = face_recognition.face_locations(rgb,
            model=detection_method)
        
        
        # compute the facial embedding for the face
        # face_encodings()
        """face_image – The image that contains one or more faces
        known_face_locations – Optional - the bounding boxes of each
        face if you already know them.
        Returns: A list of 128-dimensional face encodings (one for
        each face in the image)"""
        encodings = face_recognition.face_encodings(rgb, boxes)
        
        # loop over the encodings
        for encoding in encodings:
            # add each encoding + name to our set of known names and
            # encodings
            knownEncodings.append(encoding)
            knownNames.append(name)


    # dump the facial encodings + names to disk
    print("[INFO] serializing encodings... to ",encodings_file)
    data = {"encodings": knownEncodings, "names": knownNames}
    f = open(encodings_file, "wb")
    f.write(pickle.dumps(data))
    f.close()        
    print("Total Images Encoded:", len(knownNames))
    print("Total Faces Encoded:", len(set(knownNames)))

In [7]:
encode_face_data()

[INFO] quantifying faces...
[INFO] processing image 1/18
[INFO] processing image 2/18
[INFO] processing image 3/18
[INFO] processing image 4/18
[INFO] processing image 5/18
[INFO] processing image 6/18
[INFO] processing image 7/18
[INFO] processing image 8/18
[INFO] processing image 9/18
[INFO] processing image 10/18
[INFO] processing image 11/18
[INFO] processing image 12/18
[INFO] processing image 13/18
[INFO] processing image 14/18
[INFO] processing image 15/18
[INFO] processing image 16/18
[INFO] processing image 17/18
[INFO] processing image 18/18
[INFO] serializing encodings... to  encodings.pickle
Total Images Encoded: 18
Total Faces Encoded: 2
['parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'parikh', 'chaitanya']
