# AIM - Detect whether a person is wearing a mask using a CNN and OpenCV
## The following steps are followed to achieve this aim:
## 1) Load the dataset and convert the images to arrays.
## 2) Build the model from the pre-trained VGG-16 network (transfer learning).
## 3) Create OpenCV functions that use the model to detect a mask.

In [5]:
import cv2
import os
import tensorflow

In [2]:
# Class names double as the image directory names; a class's position in this
# list is used as its numeric label (mask -> 0, no_mask -> 1).
categories=["mask","no_mask"]

In [3]:
# Build the dataset as a list of [image, label] pairs.
# Each category name is also the directory that holds its images, and the
# category's position in `categories` is its numeric label.
data = []
for label, category in enumerate(categories):
    for file in os.listdir(category):
        imgpath = os.path.join(category, file)
        img = cv2.imread(imgpath)
        if img is None:
            # cv2.imread signals an unreadable / non-image file by returning
            # None instead of raising; skip it so cv2.resize does not crash.
            continue
        # Resize to the 224x224 input size used by the network below.
        img = cv2.resize(img, (224, 224))
        data.append([img, label])
        

In [4]:
len(data)

1263

In [5]:
# The list is ordered by class (all "mask" images first, then all "no_mask" images),
# so shuffle it to avoid presenting the model with one class at a time.
import random
random.shuffle(data)

In [6]:
# Separate the [image, label] pairs into two parallel lists:
# x holds the images, y holds the matching numeric labels.
x = [image for image, _ in data]
y = [target for _, target in data]

In [7]:
print(len(x))
len(y)

1263


1263

In [8]:
# Convert the Python lists to NumPy arrays so they can be scaled and split below.
import numpy as np
x=np.array(x)
y=np.array(y)

In [9]:
x.shape

(1263, 224, 224, 3)

In [10]:
y.shape

(1263,)

In [11]:
# Scale the pixel values by 1/255. Any image passed to the trained model later
# needs the same scaling, otherwise its inputs will not match the training data.
x=x/255

In [12]:
x

array([[[[0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         ...,
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627]],

        [[0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         ...,
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627]],

        [[0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         ...,
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627]],

        ...,

        [[0.01568627, 0.01568627, 0.01568627],
         [0.01568627, 0.01568627, 0.01568627]

In [13]:
from sklearn.model_selection import train_test_split
# Hold out 20% of the samples (test_size=0.2). No random_state is passed,
# so the exact split is not reproducible between runs.
x_train,x_test,y_train,y_test=train_test_split(x,y,test_size=0.2)

In [14]:
x_train.shape

(1010, 224, 224, 3)

In [15]:
y_train.shape

(1010,)

# Model Building

In [16]:
from keras.applications.vgg16 import VGG16

In [17]:
# include_top=True keeps VGG16's fully connected classifier layers as well as
# the convolutional blocks; the final layer is dropped when the layers are copied below.
vgg=VGG16(include_top=True)

In [18]:
vgg.summary()

Model: "vgg16"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0     

In [21]:
from keras import Sequential

In [22]:
model=Sequential()

In [23]:
# Copy every VGG16 layer except the last one into the Sequential model.
for vgg_layer in vgg.layers[:-1]:
    model.add(vgg_layer)

In [24]:
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0         
                                                                 
 block3_conv1 (Conv2D)       (None, 56, 56, 256)       2

In [25]:
# Mark every layer currently in the model as non-trainable so that fitting
# leaves the copied weights untouched.
for copied_layer in model.layers:
    copied_layer.trainable = False

In [26]:
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0         
                                                                 
 block3_conv1 (Conv2D)       (None, 56, 56, 256)       2

In [27]:
from keras.layers import Dense

In [28]:
# New output layer: a single sigmoid unit producing one score per image
# for the two-class (mask / no_mask) problem.
model.add(Dense(1,activation='sigmoid'))

In [29]:
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0         
                                                                 
 block3_conv1 (Conv2D)       (None, 56, 56, 256)       2

In [30]:
# Binary cross-entropy pairs with the single sigmoid output and the 0/1 labels.
model.compile(optimizer='Adam', loss='binary_crossentropy', metrics=['accuracy'])

In [31]:
# Train for 5 epochs. Note that the held-out test split is also what is
# reported as validation data here; there is no separate validation set.
model.fit(x_train,y_train,epochs=5,validation_data=(x_test,y_test))

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<keras.callbacks.History at 0x2926de3efd0>

In [53]:
model.save('vgg.h5')

In [1]:
# The model is trained; we can now predict whether a person is wearing a mask using the model and OpenCV.

In [17]:
from tensorflow.keras.models import load_model

In [18]:
model=load_model('vgg.h5')

In [19]:
# Open the video capture device with index 0; frames are read from it in the loop below.
cap=cv2.VideoCapture(0)

In [20]:
def detect_mask(img):
    """Return the model's sigmoid score for a single 224x224x3 image.

    The labels used for training were mask -> 0 and no_mask -> 1, so a score
    close to 1 means "no mask" and a score close to 0 means "mask".

    Args:
        img: image array containing exactly 224*224*3 values (already resized).

    Returns:
        The scalar prediction for the image (first element of the batch output).
    """
    # The training images were divided by 255 before fitting, so the same
    # scaling has to be applied here; feeding raw 0-255 pixels would give the
    # network inputs far outside the range it was trained on.
    batch = img.reshape(1, 224, 224, 3) / 255
    y_pred = model.predict(batch)
    return y_pred[0][0]

In [21]:
def draw_label(img,text,pos,col):
    """Draw `text` on `img` at `pos` on top of a filled rectangle of colour `col`.

    Args:
        img: image to draw on (modified in place).
        text: label string to render.
        pos: (x, y) anchor; cv2.putText treats it as the bottom-left corner
            of the text.
        col: fill colour of the background rectangle.
    """
    font = cv2.FONT_HERSHEY_SIMPLEX
    scale = 1
    thickness = 1

    # Measure with the same thickness that putText uses below. The original
    # passed cv2.FILLED (-1) here, which is a rectangle flag, not a thickness.
    (text_w, text_h), baseline = cv2.getTextSize(text, font, scale, thickness)

    # The text is rendered upwards from pos, so the background has to extend
    # above pos (plus the baseline below it) to actually sit behind the text.
    top_left = (pos[0], pos[1] - text_h - 2)
    bottom_right = (pos[0] + text_w + 2, pos[1] + baseline)

    cv2.rectangle(img, top_left, bottom_right, col, cv2.FILLED)
    cv2.putText(img, text, pos, font, scale, (0,0,0), thickness, cv2.LINE_AA)

In [22]:
# Face detector built from the Haar cascade XML file; the path is relative,
# so the file is looked up from the current working directory.
haar = cv2.CascadeClassifier("haarcascade_frontalface_default.xml")

In [25]:
def face_detect(img):
    """Run the Haar cascade on `img` and return its detections unchanged.

    The caller passes a grayscale frame and unpacks each detection as
    (x, y, w, h).
    """
    return haar.detectMultiScale(img)

In [28]:
# Live loop: grab a frame, classify it, outline detected faces, overlay the
# label, and show the result until 'p' is pressed or the camera stops
# delivering frames.
try:
    while True:
        ret, frame = cap.read()
        if not ret:
            # No frame was grabbed (camera busy, unplugged, or stream ended);
            # frame is unusable here and cv2.resize would raise on it.
            break

        # The classifier scores the whole frame resized to 224x224.
        img = cv2.resize(frame, (224, 224))
        y_pred = detect_mask(img)

        coords = face_detect(cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY))
        # Distinct names are used for the box so the notebook-level dataset
        # arrays `x` and `y` are not overwritten by this loop.
        for face_x, face_y, face_w, face_h in coords:
            cv2.rectangle(
                frame,
                (face_x, face_y),
                (face_x + face_w, face_y + face_h),
                (255, 0, 0),
                3,
            )

        # Label 1 is "no_mask", so a high sigmoid score means no mask.
        if y_pred > 0.9:
            draw_label(frame, "No mask", (30, 30), (0, 0, 255))
        else:
            draw_label(frame, "Mask", (30, 30), (0, 255, 0))

        cv2.imshow("window", frame)
        if cv2.waitKey(1) & 0xFF == ord('p'):
            break
finally:
    # Always free the camera and close the window, even if an error or a
    # keyboard interrupt ends the loop; otherwise the device stays locked.
    cap.release()
    cv2.destroyAllWindows()

