In [2]:
from ultralytics import YOLO
import cv2
import cvzone
import math

In [4]:
# Open the camera at device index 0 as the frame source
camera_index = 0
cap = cv2.VideoCapture(camera_index)

In [6]:
# Weights for the personal protective equipment (PPE) detector.
# NOTE: this is an absolute, machine-specific path.
weights_path = "C:/Users/arka/OneDrive/Arka_PhD/PPE_DETECTION/ppe.pt"

# Build the YOLO detector from those weights
model = YOLO(weights_path)

In [8]:
# Labels for the detector's classes; the list position is used as the class index
classNames = [
    'Hardhat',
    'Mask',
    'NO-Hardhat',
    'NO-Mask',
    'NO-Safety Vest',
    'Person',
    'Safety Cone',
    'Safety Vest',
    'Machinery',
    'Vehicle',
]

# Initial colour used for boxes and labels (red, matching the non-compliance colour)
myColor = (0, 0, 255)

# Live PPE detection: grab frames from the camera, run the YOLO model on each
# frame, draw a colour-coded box and label for every detection whose confidence
# is above 0.5, and show the annotated frame until 'q' is pressed or a frame
# cannot be read.

# An earlier cell may already hold the camera open in `cap`. Release that handle
# before opening a new one: the old handle would otherwise never be released,
# and opening a device that is still held open can fail.
previous_cap = globals().get('cap')
if previous_cap is not None:
    previous_cap.release()

# Use 0 for webcam or provide a video file path
cap = cv2.VideoCapture(0)

if not cap.isOpened():
    # Without this message the loop below would simply be skipped in silence.
    print("Could not open video source 0.")

# Class groups that decide the annotation colour (hoisted out of the frame loop)
nonCompliantClasses = {'NO-Hardhat', 'NO-Safety Vest', 'NO-Mask'}
compliantClasses = {'Hardhat', 'Safety Vest', 'Mask'}

try:
    # Main loop to process each frame of the video
    while cap.isOpened():
        # Read a frame from the video
        success, img = cap.read()

        # Stop when no frame could be captured
        if not success:
            print("Failed to read frame. Exiting...")
            break

        # Perform object detection using YOLO on the current frame
        results = model(img, stream=True)

        for r in results:
            boxes = r.boxes
            for box in boxes:
                # Corner coordinates of the bounding box, as integer pixels
                x1, y1, x2, y2 = box.xyxy[0]
                x1, y1, x2, y2 = int(x1), int(y1), int(x2), int(y2)

                # Confidence rounded up to two decimals, and the class label
                conf = math.ceil((box.conf[0] * 100)) / 100
                cls = int(box.cls[0])
                currentClass = classNames[cls]

                # Detections at or below 0.5 confidence are not drawn
                if conf <= 0.5:
                    continue

                if currentClass in nonCompliantClasses:
                    myColor = (0, 0, 255)  # Red for non-compliance
                elif currentClass in compliantClasses:
                    myColor = (0, 255, 0)  # Green for compliance
                else:
                    myColor = (255, 0, 0)  # Blue for other objects

                # Label with class name and confidence; the max() calls keep the
                # text anchor at x >= 0 and y >= 35
                cvzone.putTextRect(img, f'{currentClass} {conf}',
                                   (max(0, x1), max(35, y1)), scale=1, thickness=1, colorB=myColor,
                                   colorT=(255, 255, 255), colorR=myColor, offset=5)

                # Draw bounding box around the detected object
                cv2.rectangle(img, (x1, y1), (x2, y2), myColor, 3)

        # Display the annotated image
        cv2.imshow("Image", img)

        # Check for the 'q' key to break the loop
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
finally:
    # Always free the camera and close the window, including when the cell is
    # interrupted or an exception is raised while processing a frame.
    cap.release()
    cv2.destroyAllWindows()


0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1360.7ms
Speed: 7.6ms preprocess, 1360.7ms inference, 439.6ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1229.0ms
Speed: 8.0ms preprocess, 1229.0ms inference, 1.0ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1216.4ms
Speed: 4.5ms preprocess, 1216.4ms inference, 0.5ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1 machinery, 1191.0ms
Speed: 3.0ms preprocess, 1191.0ms inference, 1.5ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1222.7ms
Speed: 3.0ms preprocess, 1222.7ms inference, 2.0ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1224.4ms
Speed: 3.0ms preprocess, 1224.4ms inference, 1.0ms postprocess per image at shape (1, 3, 480, 640)

0: 480x640 1 NO-Hardhat, 1 NO-Mask, 1 Person, 1204.5ms