In [1]:

import os
import cv2
import time
from tqdm import tqdm
import numpy as np
import tensorflow as tf
from sklearn.model_selection import train_test_split
from tensorflow.keras.models import Sequential, load_model
from tensorflow.keras.layers import Conv2D, Dense, MaxPooling2D, Flatten, Activation, Dropout

In [2]:
img_size = 100
datadir = r'F:\cvpr\Dataset'
CATEGORIES = os.listdir(datadir)
print(CATEGORIES)

['mask_weared_incorrect', 'without_mask', 'with_mask']


In [3]:
# Define two empty list for contain image data
x, y = [], []
   
def PreProcess():
    for category in CATEGORIES:
        path = os.path.join(datadir, category)
        classIndex = CATEGORIES.index(category)
        print(path)
        for imgs in tqdm(os.listdir(path)):
            img_arr = cv2.imread(os.path.join(path, imgs))
            
            # resize the image
            resized_array = cv2.resize(img_arr, (img_size, img_size))
            cv2.imshow("images", resized_array)
            cv2.waitKey(1)
            resized_array = resized_array/255.0
            x.append(resized_array)
            y.append(classIndex)
            
PreProcess()
cv2.destroyAllWindows()

F:\cvpr\Dataset\mask_weared_incorrect


100%|██████████████████████████████████████████████████████████████████████████████| 2994/2994 [00:46<00:00, 64.12it/s]


F:\cvpr\Dataset\without_mask


100%|██████████████████████████████████████████████████████████████████████████████| 2994/2994 [00:46<00:00, 64.26it/s]


F:\cvpr\Dataset\with_mask


100%|██████████████████████████████████████████████████████████████████████████████| 2994/2994 [00:54<00:00, 55.33it/s]


In [4]:
# Split data for training and testing
X_train, X_test, y_train, y_test = train_test_split(x, y, test_size=0.20, random_state=42)

In [5]:
# Convert and resize the data to a numpy array
X_train = np.array(X_train).reshape(-1, img_size, img_size, 3)
y_train = np.array(y_train)
X_test = np.array(X_test).reshape(-1, img_size, img_size, 3)
y_test = np.array(y_test)

In [6]:
batch_size = 32
epochs = 15

In [7]:
# Create the model architecture

model = Sequential()

model.add(Conv2D(64,(3, 3), input_shape=(img_size, img_size, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size = (2, 2)))

model.add(Conv2D(256, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size = (2, 2)))

model.add(Conv2D(128, (3, 3)))
model.add(Activation('relu'))
model.add(Dropout(0.25))

model.add(Conv2D(32, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size = (2, 2)))

model.add(Dropout(0.25))
model.add(Flatten())
model.add(Dense(100, activation='relu'))
model.add(Dense(16, activation='relu'))


model.add(Dense(len(CATEGORIES)))
model.add(Activation('softmax'))

# compile the model

model.compile(optimizer='adam', loss = 'sparse_categorical_crossentropy', metrics=['accuracy'])
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d (Conv2D)             (None, 98, 98, 64)        1792      
                                                                 
 activation (Activation)     (None, 98, 98, 64)        0         
                                                                 
 max_pooling2d (MaxPooling2D  (None, 49, 49, 64)       0         
 )                                                               
                                                                 
 conv2d_1 (Conv2D)           (None, 47, 47, 256)       147712    
                                                                 
 activation_1 (Activation)   (None, 47, 47, 256)       0         
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 23, 23, 256)      0         
 2D)                                                    

In [8]:
t1 = time.time()

# fit the model
model.fit(X_train, y_train, batch_size = batch_size, epochs=5, validation_split=0.3, verbose = 1)
model.save('{}.h5'.format("model"))

t2 = time.time()
print('Time taken: ',t2-t1)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Time taken:  1110.2753925323486


In [9]:
validation_loss, validation_accuracy = model.evaluate(X_test, y_test)



In [None]:
import cv2
import mediapipe as mp
import numpy as np
import tensorflow as tf
from tensorflow.keras.models import load_model

# Load the model
model = load_model('model.h5')

# Define mediapipe Face detector

face_detection = mp.solutions.face_detection.FaceDetection()

# Detection function



def get_detection(frame):

    height, width, channel = frame.shape

    # Convert frame BGR to RGB colorspace

    imgRGB = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    # Detect results from the frame
    
    result = face_detection.process(imgRGB)


    try:
        for count, detection in enumerate(result.detections):

            # print(detection)

        
            # Extract bounding box information 
            
            box = detection.location_data.relative_bounding_box

            x, y, w, h = int(box.xmin*width), int(box.ymin * height), int(box.width*width), int(box.height*height)
            
    # If detection is not available then pass 
    except:
        pass

    return x, y, w, h

CATEGORIES = ['no_mask', 'mask']
cap = cv2.VideoCapture(0)
while True:
    _, frame = cap.read()
    img = frame.copy()
    try:
        x, y, w, h = get_detection(frame)
        
        crop_img = img[y:y+h, x:x+w]
        
        crop_img = cv2.resize(crop_img, (100, 100))
        
        crop_img = np.expand_dims(crop_img, axis=0)
        
        # get the prediction from the model.
        prediction = model.predict(crop_img)
        print(prediction)
        index = np.argmax(prediction)
        res = CATEGORIES[index]
        if index == 0:
            color = (0, 0, 255)
        else:
            color = (0, 255, 0)
        cv2.rectangle(frame, (x, y), (x+w, y+h), color, 2)
        cv2.putText(frame, res, (x, y-10), cv2.FONT_HERSHEY_SIMPLEX,
                                 0.8, color, 2, cv2.LINE_AA)

    except:
        pass
    
    cv2.imshow("frame", frame)
    if cv2.waitKey(1) == ord('q'):
        break
    
cap.release()
cv2.destroyAllWindows()

[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[3.5313791e-22 1.0000000e+00 1.0915191e-37]]
[[0. 1. 0.]]
[[6.0467080e-24 1.0000000e+00 6.4930414e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[8.1063862e-21 1.0000000e+00 9.3073264e-20]]
[[1.0562868e-23 1.0000000e+00 1.2946667e-26]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[2.1534978e-38 1.0000000e+00 1.0237471e-27]]
[[3.823703e-33 1.000000e+00 0.000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 2.2065112e-37]]
[[0. 1. 0.]]
[[6.4215666e-28 1.0000000e+00 5.7392010e-34]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[1.43198e-38 1.00000e+00 0.00000e+00]]
[[3.2315190e-27 1.0000000e+00 9.1335294e-30]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[6.061106e-28 1.000000e+00 0.000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[1.0141031e-36 1.0000000e+00 3.8904471e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[3.5378117e-29 1.

[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 1.3643216e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[1.1004085e-35 1.0000000e+00 0.0000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[8.616587e-25 1.000000e+00 0.000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[3.2527263e-29 1.0000000e+00 0.0000000e+00]]
[[0. 1. 0.]]
[[1.8794609e-38 1.0000000e+00 0.0000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[4.6941203e-37 1.0000000e+00 0.0000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 1.8936917e-35]]
[[5.1526443e-32 1.0000000e+00 3.1281576e-33]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[4.8070416e-26 1.0000000e+00 2.6457514e-35]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.

[[0. 1. 0.]]
[[8.3254525e-35 1.0000000e+00 0.0000000e+00]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.000000e+00 1.000000e+00 4.374153e-28]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 3.4056017e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 8.8699267e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 2.3270933e-37]]
[[0. 1. 0.]]
[[2.7005055e-37 1.0000000e+00 1.2379335e-38]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[4.8798440e-23 1.0000000e+00 1.3341888e-28]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 2.0752416e-34]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[1.2678109e-33 1.0000000e+00 4.1640745e-31]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 3.7429024e-32]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 3.2652328e-29]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[6.5828304e-29 1.0000000e+00 0.0000000e+00]]
[[5.92729

[[2.6457595e-29 1.8199691e-08 1.0000000e+00]]
[[9.999999e-01 8.754020e-31 8.645239e-08]]
[[0.0000000e+00 1.0000000e+00 5.2937226e-25]]
[[0.0000000e+00 1.0000000e+00 2.1926201e-26]]
[[0. 1. 0.]]
[[1.4497967e-12 1.0000000e+00 1.9736686e-14]]
[[0. 1. 0.]]
[[0.000000e+00 1.000000e+00 7.010092e-20]]
[[2.4168827e-19 1.0000000e+00 3.2697191e-22]]
[[0.0000000e+00 1.0000000e+00 1.5337069e-32]]
[[3.3872865e-20 1.0000000e+00 1.6946535e-13]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0. 1. 0.]]
[[0.0000000e+00 1.0000000e+00 2.4976858e-20]]
[[0.0000000e+00 1.0000000e+00 1.8562202e-29]]
[[0.0000000e+00 1.0000000e+00 1.2804869e-33]]