In [1]:
import cv2 
import mediapipe as mp
import time


class faceDetector():
    """Thin wrapper around MediaPipe face detection with OpenCV drawing helpers.

    Usage: create one instance, then call ``findFaces`` on each BGR frame.
    """

    def __init__(self, minDetectionCon=0.5, complexity=1):
        """Create the underlying MediaPipe ``FaceDetection`` object.

        Args:
            minDetectionCon: Minimum detection confidence passed to MediaPipe.
            complexity: Accepted for backward compatibility with existing
                callers; it is currently not forwarded to MediaPipe.
        """
        self.minDetectionCon = minDetectionCon

        self.mpFaceDetection = mp.solutions.face_detection
        self.mpDraw = mp.solutions.drawing_utils
        # Pass the threshold by keyword so the call does not depend on the
        # positional order of FaceDetection's parameters.
        self.faceDetection = self.mpFaceDetection.FaceDetection(
            min_detection_confidence=self.minDetectionCon
        )

    def findFaces(self, img, draw=True):
        """Detect faces in a BGR image and optionally annotate it.

        Args:
            img: Image in OpenCV BGR channel order; it is converted to RGB
                before being handed to MediaPipe.
            draw: When true, draw the bounding box and the confidence
                percentage of every detection onto ``img``. When false,
                ``img`` is left unmodified.

        Returns:
            A tuple ``(img, bboxs)`` where ``bboxs`` is a list of
            ``[index, (x, y, w, h), score]`` entries, one per detection.
            The box is in pixel units; ``score`` is the detection's
            ``score`` field as reported by MediaPipe.
        """
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        # Kept on the instance so callers can inspect the raw MediaPipe result.
        self.results = self.faceDetection.process(imgRGB)

        bboxs = []
        if not self.results.detections:
            return img, bboxs

        # The frame size does not change between detections; read it once.
        ih, iw = img.shape[:2]
        for index, detection in enumerate(self.results.detections):
            bboxC = detection.location_data.relative_bounding_box
            # MediaPipe reports the box relative to the image size; scale
            # it to integer pixel coordinates.
            bbox = (
                int(bboxC.xmin * iw),
                int(bboxC.ymin * ih),
                int(bboxC.width * iw),
                int(bboxC.height * ih),
            )
            bboxs.append([index, bbox, detection.score])
            if draw:
                img = self.fancyDraw(img, bbox)
                # The confidence label is part of the annotation, so it is
                # only rendered when drawing was requested.
                cv2.putText(img, f'{int(detection.score[0] * 100)}%',
                            (bbox[0], bbox[1] - 20),
                            cv2.FONT_HERSHEY_PLAIN, 2, (255, 0, 255), 2)

        return img, bboxs

    def fancyDraw(self, img, bbox, l=30, t=6, rt=1):
        """Draw a thin rectangle with thick corner accents around ``bbox``.

        Args:
            img: Image to draw on (modified in place).
            bbox: ``(x, y, w, h)`` box in pixels.
            l: Length in pixels of each corner accent line.
            t: Thickness of the corner accent lines.
            rt: Thickness of the full rectangle outline.

        Returns:
            The same ``img`` that was passed in.
        """
        x, y, w, h = bbox
        x1, y1 = x + w, y + h
        color = (255, 0, 255)

        cv2.rectangle(img, bbox, color, rt)
        # Each entry is (corner x, corner y, horizontal direction, vertical
        # direction); the accent lines run from the corner towards the
        # inside of the box.
        corners = (
            (x, y, 1, 1),      # top left
            (x1, y, -1, 1),    # top right
            (x, y1, 1, -1),    # bottom left
            (x1, y1, -1, -1),  # bottom right
        )
        for cx, cy, dx, dy in corners:
            cv2.line(img, (cx, cy), (cx + dx * l, cy), color, t)
            cv2.line(img, (cx, cy), (cx, cy + dy * l), color, t)

        return img




def main():
    """Run face detection on the default camera and display the result.

    Each frame is passed to ``faceDetector.findFaces``, the returned boxes
    are printed, and the frame is shown with an FPS overlay. The loop ends
    when a frame cannot be read or when the user presses ``q`` in the
    display window. The capture device and the window are always released.
    """
    cap = cv2.VideoCapture(0)
    # To run on a file instead of the camera:
    # cap = cv2.VideoCapture('vid5.mp4')
    pTime = 0
    detector = faceDetector()

    try:
        while True:
            success, img = cap.read()
            if not success:
                # No frame available (camera missing/unplugged or end of
                # stream); img would be None and crash the detector.
                break

            img, bboxs = detector.findFaces(img, False)
            print(bboxs)

            cTime = time.time()
            elapsed = cTime - pTime
            # Guard against two identical timestamps on coarse clocks.
            fps = 1 / elapsed if elapsed > 0 else 0
            pTime = cTime
            cv2.putText(img, f'FPS: {int(fps)}', (20, 70), cv2.FONT_HERSHEY_PLAIN, 3, (255, 0, 0), 2)

            cv2.imshow('Image', img)
            # waitKey also pumps the GUI event loop; 'q' gives a clean exit
            # instead of requiring a KeyboardInterrupt.
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
    finally:
        cap.release()
        cv2.destroyAllWindows()


# Start the webcam demo only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()

INFO: Created TensorFlow Lite XNNPACK delegate for CPU.


[]
[]
[]
[[0, (415, 295, 309, 309), [0.7945865988731384]]]
[[0, (403, 286, 343, 343), [0.9257152676582336]]]
[[0, (405, 285, 348, 348), [0.9265632629394531]]]
[[0, (404, 285, 348, 348), [0.9315089583396912]]]
[[0, (405, 284, 348, 348), [0.9311674237251282]]]
[[0, (403, 286, 349, 349), [0.9314574599266052]]]
[[0, (414, 278, 344, 344), [0.9139159917831421]]]
[[0, (412, 279, 344, 344), [0.9293625950813293]]]
[[0, (418, 280, 336, 336), [0.9251719117164612]]]
[[0, (415, 278, 339, 339), [0.9143458008766174]]]
[[0, (420, 282, 335, 335), [0.9235662221908569]]]
[[0, (413, 282, 337, 337), [0.9237804412841797]]]
[[0, (415, 286, 335, 335), [0.9375365376472473]]]
[[0, (414, 283, 334, 334), [0.940852701663971]]]
[[0, (415, 282, 332, 332), [0.9359052777290344]]]
[[0, (411, 280, 334, 334), [0.9290897250175476]]]
[[0, (411, 284, 334, 334), [0.9390571713447571]]]
[[0, (412, 280, 338, 338), [0.9401260018348694]]]
[[0, (415, 282, 340, 340), [0.9404010772705078]]]
[[0, (408, 276, 348, 348), [0.953859984874

KeyboardInterrupt: 