# by Hesham Gamal

github:https://github.com/HesahmGamal

linkedin:https://www.linkedin.com/in/hesham-gamal-11304019b/

In [None]:
from social_distancing_config import NMS_THRESH
from social_distancing_config import MIN_CONF
import numpy as np
import cv2


def detect_people(frame, net, ln, personIdx=0):
    """Detect people in a frame with a YOLO network and apply NMS.

    Args:
        frame: image array; its first two shape entries are read as
            (height, width).
        net: network object exposing ``setInput`` and ``forward``.
        ln: output layer names handed to ``net.forward``.
        personIdx: class index that counts as "person" (default 0).

    Returns:
        A list of ``(confidence, (startX, startY, endX, endY),
        (centerX, centerY))`` tuples, one per detection kept by
        non-maxima suppression. The list is empty when nothing is kept.
    """
    frame_h, frame_w = frame.shape[:2]
    # YOLO reports boxes relative to the frame size, so this vector
    # scales (centerX, centerY, width, height) back to pixels
    frame_scale = np.array([frame_w, frame_h, frame_w, frame_h])

    # run one forward pass of the detector on a 416x416 blob of the
    # frame (pixel values scaled by 1/255, R and B channels swapped)
    net.setInput(cv2.dnn.blobFromImage(frame, 1 / 255.0, (416, 416),
        swapRB=True, crop=False))
    layer_outputs = net.forward(ln)

    # parallel lists: entry k of each describes the same candidate
    boxes, centroids, confidences = [], [], []

    for layer_output in layer_outputs:
        for detection in layer_output:
            # entries 5 and up are the per-class scores; the best one
            # gives both the class ID and the confidence
            class_scores = detection[5:]
            best_class = np.argmax(class_scores)
            confidence = class_scores[best_class]

            # skip anything that is not a sufficiently confident person
            if not (best_class == personIdx and confidence > MIN_CONF):
                continue

            # the first four entries are the box center followed by the
            # box width and height
            scaled = detection[0:4] * frame_scale
            (center_x, center_y, box_w, box_h) = scaled.astype("int")

            # derive the top-left corner from the center and the size
            left = int(center_x - (box_w / 2))
            top = int(center_y - (box_h / 2))

            boxes.append([left, top, int(box_w), int(box_h)])
            centroids.append((center_x, center_y))
            confidences.append(float(confidence))

    # non-maxima suppression drops weak, overlapping boxes and returns
    # the indexes of the survivors
    keep = cv2.dnn.NMSBoxes(boxes, confidences, MIN_CONF, NMS_THRESH)

    # nothing survived (or nothing was detected in the first place)
    if len(keep) == 0:
        return []

    results = []
    for k in keep.flatten():
        (left, top, box_w, box_h) = boxes[k]
        # report the box as corner coordinates rather than corner + size
        corners = (left, top, left + box_w, top + box_h)
        results.append((confidences[k], corners, centroids[k]))

    return results

In [6]:
# import the necessary packages
import social_distancing_config as config
# from pinoydatascientist.detection import detect_people
from scipy.spatial import distance as dist
import numpy as np
import argparse
import imutils
import cv2
import os
import time



# load the COCO class labels our YOLO model was trained on
labelsPath = os.path.sep.join([config.MODEL_PATH, "coco.names"])
# read through a context manager so the file handle is closed as soon as
# the labels are in memory instead of being left open
with open(labelsPath) as labelsFile:
    LABELS = labelsFile.read().strip().split("\n")




# derive the paths to the YOLO weights and model configuration
# #yolov3
# weightsPath = os.path.sep.join([config.MODEL_PATH, "yolov3.weights"])
# configPath = os.path.sep.join([config.MODEL_PATH, "yolov3.cfg"])

# #yolov3-tiny
# weightsPath = os.path.sep.join([config.MODEL_PATH, "yolov3-tiny.weights"])
# configPath = os.path.sep.join([config.MODEL_PATH, "yolov3-tiny.cfg"])

# #yolov4
# weightsPath = os.path.sep.join([config.MODEL_PATH, "yolov4.weights"])
# configPath = os.path.sep.join([config.MODEL_PATH, "yolov4.cfg"])

#yolov4-tiny (the best in acc and performance)
weightsPath = os.path.sep.join([config.MODEL_PATH, "yolov4-tiny.weights"])
configPath = os.path.sep.join([config.MODEL_PATH, "yolov4-tiny.cfg"])

# load our YOLO object detector trained on COCO dataset (80 classes)
print("[INFO] loading YOLO from disk...")
net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)

# check if we are going to use GPU
if config.USE_GPU:
    # set CUDA as the preferable backend and target
    print("[INFO] setting preferable backend and target to CUDA...")
    net.setPreferableBackend(cv2.dnn.DNN_BACKEND_CUDA)
    net.setPreferableTarget(cv2.dnn.DNN_TARGET_CUDA)

# determine only the *output* layer names that we need from YOLO

ln = net.getLayerNames()

# the unconnected-output ids are 1-based, hence the `- 1`; flatten them
# first because older OpenCV releases return an Nx1 array while newer ones
# return a flat array, and this indexing must work with both
ln = [ln[i - 1] for i in np.asarray(net.getUnconnectedOutLayers()).flatten()]

# initialize the video stream and pointer to output video file
# (writer is only initialized here; nothing in this cell writes to it)
print("[INFO] accessing video stream...")
vs = cv2.VideoCapture('pedestrians.mp4')
writer = None

# report a stream that could not be opened; otherwise the loop below would
# just end on its first read without any explanation
if not vs.isOpened():
    print("[WARN] could not open video stream")

# release the capture and close the window even if a frame fails midway
try:
    # the index of the "person" class never changes, so look it up once
    # instead of on every frame
    personIdx = LABELS.index("person")

    # loop over the frames from the video stream
    while True:
        # read the next frame from the file
        time_st = time.time()
        (grabbed, frame) = vs.read()

        # if the frame was not grabbed, then we have reached the end
        # of the stream
        if not grabbed:
            break

        # resize the frame and then detect people (and only people) in it
        frame = imutils.resize(frame, width=700)
        results = detect_people(frame, net, ln, personIdx=personIdx)

        # initialize the set of indexes that violate the minimum social
        # distance
        violate = set()

        # ensure there are *at least* two people detections (required in
        # order to compute our pairwise distance maps)
        if len(results) >= 2:
            # extract all centroids from the results and compute the
            # Euclidean distances between all pairs of the centroids
            centroids = np.array([r[2] for r in results])
            D = dist.cdist(centroids, centroids, metric="euclidean")

            # keep only the strict upper triangle so each pair is tested
            # once and a centroid is never compared with itself, then
            # collect every index that takes part in a too-close pair
            tooClose = np.triu(D < config.MIN_DISTANCE, k=1)
            violate.update(np.argwhere(tooClose).ravel().tolist())

        # loop over the results
        for (i, (prob, bbox, centroid)) in enumerate(results):
            # extract the bounding box and centroid coordinates, then
            # pick the annotation color: red for a violation, green
            # otherwise
            (startX, startY, endX, endY) = bbox
            (cX, cY) = centroid
            color = (0, 0, 255) if i in violate else (0, 255, 0)

            # draw (1) a bounding box around the person and (2) the
            # centroid coordinates of the person; the centroid is cast to
            # plain ints so drawing does not depend on how the OpenCV
            # build handles NumPy integer scalars
            cv2.rectangle(frame, (startX, startY), (endX, endY), color, 2)
            cv2.circle(frame, (int(cX), int(cY)), 5, color, 1)

        # draw the total number of social distancing violations on the
        # output frame
        text = "Social Distancing Violations: {}".format(len(violate))
        cv2.putText(frame, text, (10, frame.shape[0] - 25),
            cv2.FONT_HERSHEY_SIMPLEX, 0.85, (0, 0, 255), 3)

        cv2.imshow("Frame", frame)
        key = cv2.waitKey(1) & 0xFF

        # frames per second for this iteration; guard against a zero
        # interval on clocks with coarse resolution
        elapsed = time.time() - time_st
        fps = 1 / elapsed if elapsed > 0 else float("inf")
        print(fps)

        # if the `q` key was pressed, break from the loop
        if key == ord("q"):
            break
finally:
    vs.release()
    cv2.destroyAllWindows()

[INFO] loading YOLO from disk...
[INFO] accessing video stream...
4.752224682131616
7.8951010251216935
9.033101743171823
9.370777981831749
8.952393962161054
7.833436675905244
8.718788521301695
8.95252772115559
9.283870168044906
9.734612929804
8.643914663501171
9.734454780073897
9.641169452994086
9.198862178397619
9.459328287521087
8.795431907447057
8.952374854059546
9.734499965186716
9.641147291525876
9.033296289595878
9.734409595380551
8.952565938745323
9.370715174587854
9.198942878134904
9.114961013221603
8.643861221882181
9.033257379640677
9.458965633111648
8.873265776724704
9.19898322853452
9.284034565802521
9.198842003684534
9.37079891776681
8.021250757794526
9.549198485534946
9.198942878134904
9.032576509681212
8.795745466136527
9.5495463497376
9.734725897043123
9.829931542324935
9.549415897691595
9.283808520386819
9.28407566615166
9.032946112065884
9.37100828226273
8.021327458337636
9.283972915961122
8.952489503892151
8.873247004914415
9.641036485713038
9.459434955874958
8.95235