# Face Recognition using Transfer Learning on VGG16

## Creating images dataset using opencv through webcam

In [None]:
import cv2
import numpy as np

# Load HAAR face classifier
face_classifier = cv2.CascadeClassifier('haarcascade_frontalface_default.xml')

# Load functions
def face_extractor(img):
    # Function detects faces and returns the cropped face
    # If no face detected, it returns the input image
    
    gray = cv2.cvtColor(img,cv2.COLOR_BGR2GRAY)
    faces = face_classifier.detectMultiScale(gray, 1.3, 5)
    
    if faces is ():
        return None
    
    # Crop all faces found
    for (x,y,w,h) in faces:
        cropped_face = img[y:y+h, x:x+w]

    return cropped_face

# Initialize Webcam
cap = cv2.VideoCapture(0)
count = 0

# Collect 1000 samples of your face from webcam input
while True:

    ret, frame = cap.read()
    if face_extractor(frame) is not None:
        count += 1
        face = cv2.resize(face_extractor(frame), (200, 200))
        face = cv2.cvtColor(face, cv2.COLOR_BGR2GRAY)

        # Save file in specified directory with unique name
        file_name_path = 'C://Users//vivekPC//Desktop//MLOps WS//FRTL//FRsamples//vivek' + str(count) + '.jpg'
        cv2.imwrite(file_name_path, face)

        # Put count on images and display live count
        cv2.putText(face, str(count), (50, 50), cv2.FONT_HERSHEY_COMPLEX, 1, (0,255,0), 2)
        cv2.imshow('Face Cropper', face)
        
    else:
        print("Face not found")
        pass

    if cv2.waitKey(1) == 13 or count == 1000: #13 is the Enter Key
        break
        
cap.release()
cv2.destroyAllWindows()      
print("Collecting Samples Complete")

## Loading the VGG16 Model and freezing all layers except the top 4

In [2]:
from keras.applications import VGG16

# VGG16 was designed to work on 224 x 224 pixel input images sizes
img_rows = 224
img_cols = 224 

# loads the VGG16 model without the top or FC layers
model = VGG16(weights = 'imagenet', 
                 include_top = False, 
                 input_shape = (img_rows, img_cols, 3))

# Here we freeze the last 4 layers 
# Layers are set to trainable as True by default
for layer in model.layers:
    layer.trainable = False
    
# Let's print our layers 
for (i,layer) in enumerate(model.layers):
    print(str(i) + " "+ layer.__class__.__name__, layer.trainable)

Using TensorFlow backend.


0 InputLayer False
1 Conv2D False
2 Conv2D False
3 MaxPooling2D False
4 Conv2D False
5 Conv2D False
6 MaxPooling2D False
7 Conv2D False
8 Conv2D False
9 Conv2D False
10 MaxPooling2D False
11 Conv2D False
12 Conv2D False
13 Conv2D False
14 MaxPooling2D False
15 Conv2D False
16 Conv2D False
17 Conv2D False
18 MaxPooling2D False


## Making a function that returns our Fully Connected Head

In [3]:
def addTopModel(bottom_model, num_classes, D=256):
    """creates the top or head of the model that will be 
    placed ontop of the bottom layers"""
    top_model = bottom_model.output
    top_model = Flatten(name = "flatten")(top_model)
    top_model = Dense(D, activation = "relu")(top_model)
    top_model = Dropout(0.3)(top_model)
    top_model = Dense(num_classes, activation = "softmax")(top_model)
    return top_model

model.input

<tf.Tensor 'input_1:0' shape=(None, 224, 224, 3) dtype=float32>

## Getting model layers

In [4]:
model.layers

[<keras.engine.input_layer.InputLayer at 0x1b8fc156d08>,
 <keras.layers.convolutional.Conv2D at 0x1b88afca208>,
 <keras.layers.convolutional.Conv2D at 0x1b88afca848>,
 <keras.layers.pooling.MaxPooling2D at 0x1b88afedb48>,
 <keras.layers.convolutional.Conv2D at 0x1b88b004ac8>,
 <keras.layers.convolutional.Conv2D at 0x1b88b2105c8>,
 <keras.layers.pooling.MaxPooling2D at 0x1b88b212a48>,
 <keras.layers.convolutional.Conv2D at 0x1b88b216e48>,
 <keras.layers.convolutional.Conv2D at 0x1b88b21c308>,
 <keras.layers.convolutional.Conv2D at 0x1b88b21cdc8>,
 <keras.layers.pooling.MaxPooling2D at 0x1b88b223c08>,
 <keras.layers.convolutional.Conv2D at 0x1b88b227f88>,
 <keras.layers.convolutional.Conv2D at 0x1b88b22d1c8>,
 <keras.layers.convolutional.Conv2D at 0x1b88b2301c8>,
 <keras.layers.pooling.MaxPooling2D at 0x1b88b233e88>,
 <keras.layers.convolutional.Conv2D at 0x1b88b234888>,
 <keras.layers.convolutional.Conv2D at 0x1b88b23d448>,
 <keras.layers.convolutional.Conv2D at 0x1b88b23e848>,
 <keras.

## Adding our FC Head back onto VGG16 and get summary

In [5]:
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten
from keras.layers import Conv2D, MaxPooling2D, ZeroPadding2D
from keras.layers.normalization import BatchNormalization
from keras.models import Model

num_classes = 2

FC_Head = addTopModel(model, num_classes)

modelnew = Model(inputs=model.input, outputs=FC_Head)

print(modelnew.summary())

Model: "model_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 224, 224, 3)       0         
_________________________________________________________________
block1_conv1 (Conv2D)        (None, 224, 224, 64)      1792      
_________________________________________________________________
block1_conv2 (Conv2D)        (None, 224, 224, 64)      36928     
_________________________________________________________________
block1_pool (MaxPooling2D)   (None, 112, 112, 64)      0         
_________________________________________________________________
block2_conv1 (Conv2D)        (None, 112, 112, 128)     73856     
_________________________________________________________________
block2_conv2 (Conv2D)        (None, 112, 112, 128)     147584    
_________________________________________________________________
block2_pool (MaxPooling2D)   (None, 56, 56, 128)       0   

## Loading our face sample Dataset
### Point to noted here is that we split our dataset in two parts - Training & Testing. For training we give only 80% of data (800 face images) and remaining 20% (200 face images) for testing/validation

In [6]:
from keras.preprocessing.image import ImageDataGenerator

train_data_dir = 'FRsamples/train/'
validation_data_dir = 'FRsamples/validation/'

train_datagen = ImageDataGenerator(
      rescale=1./255,
      rotation_range=20,
      width_shift_range=0.2,
      height_shift_range=0.2,
      horizontal_flip=True,
      fill_mode='nearest')
 
validation_datagen = ImageDataGenerator(rescale=1./255)
 
# Change the batchsize according to your system RAM
train_batchsize = 16
val_batchsize = 10
 
train_generator = train_datagen.flow_from_directory(
        train_data_dir,
        target_size=(img_rows, img_cols),
        batch_size=train_batchsize,
        class_mode='categorical')
 
validation_generator = validation_datagen.flow_from_directory(
        validation_data_dir,
        target_size=(img_rows, img_cols),
        batch_size=val_batchsize,
        class_mode='categorical',
        shuffle=False)

Found 1600 images belonging to 2 classes.
Found 400 images belonging to 2 classes.


## Training our top layers and saving model 

In [7]:
from keras.optimizers import RMSprop
from keras.callbacks import ModelCheckpoint, EarlyStopping
                   
checkpoint = ModelCheckpoint("FRTL_vgg.h5",
                             monitor="val_loss",
                             mode="min",
                             save_best_only = True,
                             verbose=1)

earlystop = EarlyStopping(monitor = 'val_loss', 
                          min_delta = 0, 
                          patience = 3,
                          verbose = 1,
                          restore_best_weights = True)

# we put our call backs into a callback list
callbacks = [earlystop, checkpoint]

# Note we use a very small learning rate 
modelnew.compile(loss = 'categorical_crossentropy',
              optimizer = RMSprop(lr = 0.001),
              metrics = ['accuracy'])

nb_train_samples = 1600
nb_validation_samples = 400

# We only train 3 EPOCHS 
epochs = 3
batch_size = 16

history = modelnew.fit_generator(
    train_generator,
    steps_per_epoch = nb_train_samples // batch_size,
    epochs = epochs,
    callbacks = callbacks,
    validation_data = validation_generator,
    validation_steps = nb_validation_samples // batch_size)

modelnew.save("FRTL_vgg.h5")

Epoch 1/3

Epoch 00001: val_loss improved from inf to 0.07150, saving model to FRTL_vgg.h5
Epoch 2/3

Epoch 00002: val_loss improved from 0.07150 to 0.01531, saving model to FRTL_vgg.h5
Epoch 3/3

Epoch 00003: val_loss improved from 0.01531 to 0.00190, saving model to FRTL_vgg.h5


## As we can see above ...
### In first epoch our model has 72% accuracy, it gets 91% on second and finally in third epoch it increased upto 95% accuracy and validation accuracy is 100% means it can predict all the input images. 

## Loading our saved model as a classifier

In [27]:
from keras.models import load_model

classifier = load_model('FRTL_vgg.h5')

## Testing our classifier on some test images : Predicting Face Recognition

In [40]:
import os
import cv2
import numpy as np
from os import listdir
from os.path import isfile, join

FRsample_dict = {"[0]": "vedant", 
                      "[1]": "vivek"}

FRsample_dict_n = {"vedant": "Vedant ", 
                      "vivek": "Vivek"}

def draw_test(name, pred, im):
    FRsamples = FRsample_dict[str(pred)]
    BLACK = [0,0,0]
    expanded_image = cv2.copyMakeBorder(im, 80, 0, 0, 100 ,cv2.BORDER_CONSTANT,value=BLACK)
    cv2.putText(expanded_image, FRsamples, (20, 60) , cv2.FONT_HERSHEY_SIMPLEX,1, (0,0,255), 2)
    cv2.imshow(name, expanded_image)

def getRandomImage(path):
    """function loads a random images from a random folder in our test path """
    folders = list(filter(lambda x: os.path.isdir(os.path.join(path, x)), os.listdir(path)))
    random_directory = np.random.randint(0,len(folders))
    path_class = folders[random_directory]
    print("Class - " + FRsample_dict_n[str(path_class)])
    file_path = path + path_class
    file_names = [f for f in listdir(file_path) if isfile(join(file_path, f))]
    random_file_index = np.random.randint(0,len(file_names))
    image_name = file_names[random_file_index]
    return cv2.imread(file_path+"/"+image_name)    

# Randomly t
for i in range(0,20):
    input_im = getRandomImage("FRsamples/validation/")
    input_original = input_im.copy()
    input_original = cv2.resize(input_original, None, fx=0.5, fy=0.5, interpolation = cv2.INTER_LINEAR)
    
    input_im = cv2.resize(input_im, (224, 224), interpolation = cv2.INTER_LINEAR)
    input_im = input_im / 255.
    input_im = input_im.reshape(1,224,224,3) 
    
    # Get Prediction
    res = np.argmax(classifier.predict(input_im, 1, verbose = 0), axis=1)
    
    # Show image with predicted class
    draw_test("Prediction", res, input_original) 
    cv2.waitKey(0)
cv2.destroyAllWindows()

Class - Vivek
Class - Vivek
Class - Vedant 
Class - Vivek
Class - Vedant 
Class - Vedant 
Class - Vedant 
Class - Vedant 
Class - Vivek
Class - Vivek
Class - Vedant 
Class - Vedant 
Class - Vedant 
Class - Vivek
Class - Vedant 
Class - Vedant 
Class - Vivek
Class - Vivek
Class - Vivek
Class - Vedant 


## Here we done face recognition successfully !