# Face Mask Detection using MobileNet

In [4]:
#Defining our data generators
from __future__ import print_function
import keras
from keras.preprocessing.image import ImageDataGenerator
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten, BatchNormalization
from keras.layers import Conv2D, MaxPooling2D
from keras.preprocessing.image import ImageDataGenerator
import os

img_rows, img_cols = 128,128
batch_size = 16

train_data_dir = './dataset/train'
validation_data_dir = './dataset/validation'

# Let's use some data augmentation and define our generators
train_datagen = ImageDataGenerator(
      rescale=1./255,
      rotation_range=30,
      shear_range=0.3,
      zoom_range=0.3,
      width_shift_range=0.4,
      height_shift_range=0.4,
      horizontal_flip=True,
      fill_mode='nearest')
 
validation_datagen = ImageDataGenerator(rescale=1./255)
 
train_generator = train_datagen.flow_from_directory(
        train_data_dir,
        target_size=(img_rows, img_cols),
        batch_size=batch_size,
        class_mode='categorical',
        shuffle=True)

validation_generator = validation_datagen.flow_from_directory(
        validation_data_dir,
        target_size=(img_rows, img_cols),
        batch_size=batch_size,
        class_mode='categorical',
        shuffle=True)

train_images = train_generator.samples
validation_images = validation_generator.samples

FileNotFoundError: [WinError 3] The system cannot find the path specified: './dataset/train'

# Loading the MobileNet

In [None]:
"""
    We will use the pretrained MobileNet to which we will add our own network of FC layers.
    We then train the new model formed for the additional layers.

"""
from keras.applications import MobileNet

# Lets load the MobileNet model without the top or FC layers
MobileNet = MobileNet(weights = 'imagenet', 
                 include_top = False, 
                 input_shape = (img_rows, img_cols, 3))

# Layers are set to be trainable as True by default but lets make them untrainable
for layer in MobileNet.layers:
    layer.trainable = False
    
# Let's check our layers 
for (i,layer) in enumerate(MobileNet.layers):
    print(str(i) + " "+ layer.__class__.__name__, layer.trainable)

In [None]:
def addTopModelMobileNet(bottom_model):
    """
    
        Creates the head of the model that will be 
        placed ontop of the bottom layers
    
    """

    top_model = bottom_model.output
    top_model = GlobalAveragePooling2D()(top_model)
    top_model = Dense(512,activation='relu')(top_model)
    top_model = Dense(128,activation='relu')(top_model)
    top_model = Dense(64,activation='relu')(top_model)
    
    top_model = Dense(2,activation='sigmoid')(top_model)
    return top_model


#Combining the model
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten, GlobalAveragePooling2D
from keras.layers import Conv2D, MaxPooling2D, ZeroPadding2D
from keras.layers.normalization import BatchNormalization
from keras.models import Model

FC_Head = addTopModelMobileNet(MobileNet)

model = Model(inputs = MobileNet.input, outputs = FC_Head)

print(model.summary())

# Training the model

In [None]:
#Training our model
#One could do some tweakings!
from keras.optimizers import RMSprop, SGD,Adadelta
from keras.callbacks import ModelCheckpoint, EarlyStopping, ReduceLROnPlateau

                     
checkpoint = ModelCheckpoint("face_mask_detector.h5",
                             monitor="val_loss",
                             mode="min",
                             save_best_only = True,
                             verbose=1)

earlystop = EarlyStopping(monitor = 'val_loss', 
                          min_delta = 0, 
                          patience = 3,
                          verbose = 1,
                          restore_best_weights = True)

reduce_lr = ReduceLROnPlateau(monitor = 'val_loss', factor = 0.1, patience = 2, verbose = 1, min_delta = 0.0001)

callbacks = [earlystop, checkpoint, reduce_lr]

nb_train_samples = train_images
nb_validation_samples = validation_images
batch_size = 16
epochs = 20

model.compile(loss = 'categorical_crossentropy',
                  optimizer = 'rmsprop',
                  metrics = ['accuracy'])

history = model.fit_generator(
    train_generator,
    steps_per_epoch = nb_train_samples // batch_size,
    epochs = epochs,
    callbacks = callbacks,
    validation_data = validation_generator,
    validation_steps = nb_validation_samples // batch_size)


# Testing the model

In [2]:
# Loading our model
from keras.models import load_model
classifier = load_model('face_mask_detector.h5')

In [3]:
#Test on realtime video
from os import listdir
from os.path import isfile, join
import os
import cv2
import numpy as np
img_rows, img_cols = 128,128
# A function that puts the predicted class lables on the parametric image frames
def draw_label(image, point, label, font=cv2.FONT_HERSHEY_SIMPLEX,
               font_scale=0.8, thickness=1):
    size = cv2.getTextSize(label, font, font_scale, thickness)[0]
    x, y = point
    cv2.rectangle(image, (x, y - size[1]), (x + size[0], y), (255, 0, 0), cv2.FILLED)
    cv2.putText(image, label, point, font, font_scale, (255, 255, 255), thickness, lineType=cv2.LINE_AA)
    
#Define our prediction dictionary
face_classes = {0: 'with_mask', 1: 'without_mask'}
img_size = 128

detector = cv2.CascadeClassifier('haarcascade_frontalface_default.xml')

cap = cv2.VideoCapture(0)

while True:
    
    ret, frame = cap.read()
    preprocessed_faces = []           
 
    input_img = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    img_h, img_w, _ = np.shape(frame)
    detected = detector.detectMultiScale(frame)
    faces = np.empty((len(detected), img_size, img_size, 3))
   
    if len(detected) > 0:
        
        for f in detected:
            
            # Obtain the coordinates of the detected face and draw a bounding box
            x1, y1, w, h = [v for v in f]
            cv2.rectangle(frame, (x1, y1), (x1+w,y1+h), (255, 0, 0), 2)
            face =  frame[y1:y1+h, x1:x1+w, :]
            face = cv2.resize(face, (img_rows,img_cols))
            face = face.astype("float32") / 255.0
            face = np.expand_dims(face, axis=0)
            preprocessed_faces.append(face)

        
        # Make predictions for the detected face 
        face_labels = []
        for i, d in enumerate(detected):
            preds = classifier.predict(preprocessed_faces[i])[0]
            face_labels.append(face_classes[np.argmax(preds,axis=0)])
            print(preds)
        
        # Putting labels on frames
        for i, d in enumerate(detected):
            label = "{}".format(face_labels[i])
            print(label)
            draw_label(frame, (x1,y1), label)
    
    #Display the results
    cv2.imshow("Face Mask Recognition", frame)
    if cv2.waitKey(1) == 13: #13 is the Enter Key
        break

cap.release()
cv2.destroyAllWindows()      

[0.01835509 0.9999838 ]
without_mask
[0.09040745 0.9999305 ]
without_mask
[0.32733202 0.9997234 ]
without_mask
[0.0926152 0.9999398]
without_mask
[0.03739132 0.9999584 ]
without_mask
[0.03762241 0.9999521 ]
without_mask
[0.13162513 0.99992967]
without_mask
[0.03398857 0.999959  ]
without_mask
[0.13667853 0.9999012 ]
without_mask
[0.18586437 0.99984264]
without_mask
[0.25007874 0.9998913 ]
without_mask
[0.16383754 0.9999232 ]
without_mask
[0.15484083 0.9999014 ]
without_mask
[0.02168613 0.99995637]
without_mask
[0.27787504 0.9997806 ]
without_mask
[0.18692192 0.99988365]
without_mask
[0.03021489 0.999977  ]
without_mask
[0.03826395 0.9999653 ]
without_mask
[0.03396168 0.99998486]
without_mask
[0.06239235 0.999946  ]
without_mask
[0.01497091 0.9999877 ]
without_mask
[0.01662387 0.9999901 ]
without_mask
[0.00520175 0.9999958 ]
without_mask
[0.02807541 0.99998605]
without_mask
[0.02605105 0.99998915]
without_mask
[0.09144321 0.99994385]
without_mask
[0.0666033 0.9999584]
without_mask
[0.00

[0.06777087 0.9999504 ]
without_mask
[0.02598051 0.99995613]
without_mask
[0.24238329 0.9998857 ]
without_mask
[0.11693063 0.99994683]
without_mask
[0.03425861 0.9999541 ]
without_mask
[0.03824751 0.99998045]
without_mask
[0.0029865 0.9999958]
without_mask
[0.00757478 0.9999907 ]
without_mask
[0.0090864 0.999987 ]
without_mask
[0.03807162 0.9999672 ]
without_mask
[0.01419357 0.9999722 ]
without_mask
[0.03757757 0.99996567]
without_mask
[0.0355675 0.9999504]
without_mask
[0.27367857 0.9998325 ]
without_mask
[0.0074221 0.9999914]
without_mask
[0.00700294 0.9999801 ]
without_mask
[0.02197915 0.99997556]
without_mask
[0.09342593 0.9999337 ]
without_mask
[0.00830713 0.9999831 ]
without_mask
[0.06987151 0.9999232 ]
without_mask
[0.0099327 0.9999771]
without_mask
[0.0054831 0.999982 ]
without_mask
[0.07300052 0.9999356 ]
without_mask
[0.01718876 0.99997663]
without_mask
[0.1770056  0.99986744]
without_mask
[0.02747776 0.99996674]
without_mask
[0.0423121  0.99995244]
without_mask
[0.02417536 0

<img src = 'test.png'>

<img src = 'test2.png'>

In [None]:
#You can use some images for testing also using this part of the code
from os import listdir
from os.path import isfile, join
import os
import cv2
import numpy as np

# A function that puts the predicted class lables on the parametric image frames
def draw_label(image, point, label, font=cv2.FONT_HERSHEY_SIMPLEX,
               font_scale=0.8, thickness=1):
    size = cv2.getTextSize(label, font, font_scale, thickness)[0]
    x, y = point
    cv2.rectangle(image, (x, y - size[1]), (x + size[0], y), (255, 0, 0), cv2.FILLED)
    cv2.putText(image, label, point, font, font_scale, (255, 255, 255), thickness, lineType=cv2.LINE_AA)
    
#Define our prediction dictionary
face_classes = {0: 'with_mask', 1: 'without_mask'}
img_size = 128

detector = cv2.CascadeClassifier('haarcascade_frontalface_default.xml')
    
frame = cv2.imread('test2.png')
preprocessed_faces = []           

input_img = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
img_h, img_w, _ = np.shape(frame)
detected = detector.detectMultiScale(frame)
faces = np.empty((len(detected), img_size, img_size, 3))

if len(detected) > 0:

    for f in detected:

        # Obtain the coordinates of the detected face and draw a bounding box
        x1, y1, w, h = [v for v in f]
        cv2.rectangle(frame, (x1, y1), (x1+w,y1+h), (255, 0, 0), 2)
        face =  frame[y1:y1+h, x1:x1+w, :]
        face = cv2.resize(face, (img_rows,img_cols))
        face = face.astype("float32") / 255.0
        face = np.expand_dims(face, axis=0)
        preprocessed_faces.append(face)


    # Make predictions for the detected face 
    face_labels = []
    for i, d in enumerate(detected):
        preds = classifier.predict(preprocessed_faces[i])[0]
        face_labels.append(face_classes[np.argmax(preds,axis=0)])
        print(preds)

    # Putting labels on frames
    for i, d in enumerate(detected):
        label = "{}".format(face_labels[i])
        print(label)
        draw_label(frame, (x1,y1), label)

# Display the results
cv2.imshow("Face Recognition", frame)
cv2.waitKey(0) == 13


cap.release()
cv2.destroyAllWindows()      