In [59]:
import numpy as np
import time
import cv2
import os

yolo_path = 'yolo-coco' # Path to the YOLO weights directory
# Input image, resolved relative to the notebook's working directory.
image_path = os.path.join('images', 'living_room.jpg')
# Detections whose best class score does not exceed this value are discarded;
# the same value is also passed to cv2.dnn.NMSBoxes as its score threshold.
min_confidence = 0.5
# Passed to cv2.dnn.NMSBoxes as the non-maximum-suppression threshold.
threshold = 0.3

In [4]:
# Show which OpenCV build the kernel imported (the saved output of this cell reads '3.4.2').
cv2.__version__

'3.4.2'

In [20]:
# Read the class names (one per line) that the network's class indices map to.
labelsPath = os.path.join(yolo_path, 'coco.names')
# Use a context manager so the file handle is closed deterministically
# instead of being left open until garbage collection.
with open(labelsPath) as labels_file:
    LABELS = labels_file.read().strip().split('\n')

# Fixed seed so every class gets the same colour on each run.
np.random.seed(42)
# One 3-channel uint8 colour per label. randint's upper bound is exclusive,
# so channel values fall in 0..254.
COLORS = np.random.randint(0, 255, size=(len(LABELS), 3),
    dtype='uint8')

In [21]:
# Locate the Darknet network definition and its weights inside yolo_path.
configPath, weightsPath = (
    os.path.join(yolo_path, filename)
    for filename in ('yolov3.cfg', 'yolov3.weights')
)

# Build the network from the config/weights pair.
net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)

In [33]:
# Load the input image. cv2.imread reports failure by returning None rather
# than raising, so fail here with a clear message instead of an opaque
# attribute error on the next line.
image = cv2.imread(image_path)
if image is None:
    raise IOError("Could not read image: {}".format(image_path))
(H, W) = image.shape[:2]

# Resolve the names of the network's unconnected output layers.
# getUnconnectedOutLayers() yields 1-based layer indices; depending on the
# OpenCV build they arrive as an Nx1 array or as a flat array, so flatten
# first to make the lookup work with either shape.
layer_names = net.getLayerNames()
out_layer_ids = np.array(net.getUnconnectedOutLayers()).flatten()
ln = [layer_names[i - 1] for i in out_layer_ids]

In [41]:
# Build the network input: scale pixel values by 1/255, resize to 416x416 and
# swap the R and B channels.
# crop must be False here: with crop=True the image is resized and then
# centre-cropped, so the network never sees the cropped-off edges and the
# predicted coordinates are relative to the crop, while the post-processing
# cell scales them by the full image W and H.
blob = cv2.dnn.blobFromImage(image, 1 / 255.0, (416, 416),
    swapRB=True, crop=False)
net.setInput(blob)

# Time only the forward pass through the requested output layers.
start = time.time()
layerOutputs = net.forward(ln)
end = time.time()

print("[INFO] YOLO took {:.6f} seconds".format(end - start))

[INFO] YOLO took 0.637063 seconds


In [60]:
# Accumulators for every detection that clears the confidence cutoff.
boxes, confidences, classIDs = [], [], []

for output in layerOutputs:
    for detection in output:
        # Values from index 5 onward are treated as per-class scores;
        # keep the best-scoring class and its score.
        scores = detection[5:]
        classID = np.argmax(scores)
        confidence = scores[classID]

        # Skip anything that does not strictly exceed the cutoff.
        if not confidence > min_confidence:
            continue

        # The first four values are scaled by the image size and read as
        # (centre x, centre y, width, height) in pixels.
        scaled = detection[0:4] * np.array([W, H, W, H])
        centerX, centerY, width, height = scaled.astype('int')

        # Convert the centre-based box to a top-left corner.
        left = int(centerX - (width / 2))
        top = int(centerY - (height / 2))

        boxes.append([left, top, int(width), int(height)])
        confidences.append(float(confidence))
        classIDs.append(classID)

In [62]:
# Run non-maximum suppression over the collected boxes; idxs holds the
# indices (into boxes / confidences / classIDs) of the boxes that are kept.
idxs = cv2.dnn.NMSBoxes(
    boxes,
    confidences,
    min_confidence,
    threshold,
)

In [65]:
# Draw every box kept by NMS, together with its label, onto the image in place.
if len(idxs) > 0:
    for i in idxs.flatten():
        x, y, w, h = boxes[i]
        class_id = classIDs[i]

        # Convert the uint8 colour row to plain Python ints for the drawing calls.
        color = list(map(int, COLORS[class_id]))
        text = "{}: {:.4f}".format(LABELS[class_id], confidences[i])

        cv2.rectangle(image, (x, y), (x + w, y + h), color, 2)
        # Label sits 5 px above the box's top-left corner.
        cv2.putText(
            image, text, (x, y - 5),
            cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2,
        )

In [67]:
# Write the annotated image to output.png (relative to the working directory);
# imwrite's return value is displayed as this cell's output.
cv2.imwrite('output.png', image)

True