In [5]:
import cv2
import argparse

from ultralytics import YOLO
import supervision as sv
import numpy as np

def parse_arguments() -> argparse.Namespace:
    parser = argparse.ArgumentParser(description="YOLOv8 live")
    parser.add_argument(
        "--webcam-resolution", 
        default=[1280, 720], 
        nargs=2, 
        type=int
    )
    args = parser.parse_args(args=[])
    return args


def main():
    args = parse_arguments()
    frame_width, frame_height = args.webcam_resolution

    cap = cv2.VideoCapture(0)

    cap.set(cv2.CAP_PROP_FRAME_WIDTH, frame_width)
    cap.set(cv2.CAP_PROP_FRAME_HEIGHT, frame_height)

    model = YOLO("yolov8n.pt")

    box_annotator = sv.BoxAnnotator(
        thickness=2,
        text_thickness=2,
        text_scale=1
    )

    while True:
        ret, frame = cap.read()
        result = model(frame, agnostic_nms=True)[0]
        detections = sv.Detections.from_yolov8(result)
        labels = [
            f"{model.model.names[class_id]} {confidence:0.2f}"
            for _, _, confidence, class_id, _
            in detections
        ]
        frame = box_annotator.annotate(
            scene=frame, 
            detections=detections, 
            labels=labels
        )
        fps=cv2.CAP_PROP_FPS
        print(fps)
        cv2.putText(frame, 'fps:'.format(fps), (100,100), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (255, 0, 0), 2, cv2.LINE_AA)
        cv2.imshow("yolov8", frame)

        if (cv2.waitKey(30) == 27):
            break


if __name__ == "__main__":
    main()


0: 384x640 2 persons, 54.6ms
Speed: 4.0ms preprocess, 54.6ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 33.0ms
Speed: 7.0ms preprocess, 33.0ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 32.6ms
Speed: 3.8ms preprocess, 32.6ms inference, 7.2ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 34.3ms
Speed: 3.4ms preprocess, 34.3ms inference, 5.3ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 2 chairs, 50.3ms
Speed: 4.7ms preprocess, 50.3ms inference, 15.2ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 41.9ms
Speed: 12.0ms preprocess, 41.9ms inference, 7.3ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 45.1ms
Speed: 7.8ms preprocess, 45.1ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 37.5ms
Speed: 6.5ms preprocess, 37.5ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 38.7ms
Speed: 9.2ms preprocess, 38.7ms inference, 11.4ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 36.3ms
Speed: 9.4ms preprocess, 36.3ms inference, 16.7ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 45.7ms
Speed: 5.7ms preprocess, 45.7ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 37.8ms
Speed: 6.5ms preprocess, 37.8ms inference, 8.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 40.1ms
Speed: 6.9ms preprocess, 40.1ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 39.6ms
Speed: 5.5ms preprocess, 39.6ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 40.4ms
Speed: 1.3ms preprocess, 40.4ms inference, 10.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 32.7ms
Speed: 8.2ms preprocess, 32.7ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 32.6ms
Speed: 10.1ms preprocess, 32.6ms inference, 15.8ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 41.1ms
Speed: 0.0ms preprocess, 41.1ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 32.8ms
Speed: 4.8ms preprocess, 32.8ms inference, 9.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 37.9ms
Speed: 7.6ms preprocess, 37.9ms inference, 7.8ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 35.8ms
Speed: 5.8ms preprocess, 35.8ms inference, 15.3ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.7ms
Speed: 10.8ms preprocess, 31.7ms inference, 16.1ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 34.4ms
Speed: 8.4ms preprocess, 34.4ms inference, 18.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 37.8ms
Speed: 4.3ms preprocess, 37.8ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 38.1ms
Speed: 5.9ms preprocess, 38.1ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 39.9ms
Speed: 6.6ms preprocess, 39.9ms inference, 10.4ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 49.6ms
Speed: 12.9ms preprocess, 49.6ms inference, 7.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 40.2ms
Speed: 6.6ms preprocess, 40.2ms inference, 7.1ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 43.2ms
Speed: 6.5ms preprocess, 43.2ms inference, 9.7ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 44.2ms
Speed: 9.0ms preprocess, 44.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 46.9ms
Speed: 0.0ms preprocess, 46.9ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 46.9ms
Speed: 0.0ms preprocess, 46.9ms inference, 10.1ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 1 person, 40.9ms
Speed: 0.0ms preprocess, 40.9ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.1ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cup, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.1ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 14.5ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 30.2ms
Speed: 0.0ms preprocess, 30.2ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 28.7ms
Speed: 0.0ms preprocess, 28.7ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 29.7ms
Speed: 0.0ms preprocess, 29.7ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 30.2ms
Speed: 0.0ms preprocess, 30.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cell phone, 1 toothbrush, 30.2ms
Speed: 0.0ms preprocess, 30.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 2 toothbrushs, 28.7ms
Speed: 0.0ms preprocess, 28.7ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 30.2ms
Speed: 0.0ms preprocess, 30.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 30.2ms
Speed: 0.0ms preprocess, 30.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 29.7ms
Speed: 0.0ms preprocess, 29.7ms inference, 15.7ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 29.6ms
Speed: 0.0ms preprocess, 29.6ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 30.1ms
Speed: 0.0ms preprocess, 30.1ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 29.7ms
Speed: 0.0ms preprocess, 29.7ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 29.7ms
Speed: 0.0ms preprocess, 29.7ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 28.6ms
Speed: 0.0ms preprocess, 28.6ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 30.7ms


5
5


Speed: 0.0ms preprocess, 30.7ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 1 chair, 43.4ms
Speed: 0.0ms preprocess, 43.4ms inference, 4.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 1 toothbrush, 34.8ms
Speed: 5.3ms preprocess, 34.8ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 cell phone, 1 toothbrush, 39.2ms
Speed: 5.1ms preprocess, 39.2ms inference, 4.9ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 37.3ms
Speed: 3.1ms preprocess, 37.3ms inference, 3.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 33.6ms


5
5


Speed: 4.5ms preprocess, 33.6ms inference, 5.2ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 34.3ms
Speed: 3.6ms preprocess, 34.3ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 35.0ms


5
5


Speed: 3.0ms preprocess, 35.0ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 36.0ms
Speed: 3.0ms preprocess, 36.0ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 34.5ms
Speed: 4.0ms preprocess, 34.5ms inference, 7.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 35.6ms
Speed: 4.4ms preprocess, 35.6ms inference, 4.9ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 35.6ms
Speed: 3.3ms preprocess, 35.6ms inference, 6.9ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 35.4ms
Speed: 3.0ms preprocess, 35.4ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 35.0ms
Speed: 4.0ms preprocess, 35.0ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 34.8ms
Speed: 3.9ms preprocess, 34.8ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 37.6ms
Speed: 4.0ms preprocess, 37.6ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 38.8ms
Speed: 5.0ms preprocess, 38.8ms inference, 10.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 45.2ms
Speed: 0.0ms preprocess, 45.2ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 47.3ms
Speed: 0.0ms preprocess, 47.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 15.7ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 14.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 14.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 15.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 14.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 chairs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 44.3ms
Speed: 0.0ms preprocess, 44.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 13.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 13.1ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 42.8ms
Speed: 6.2ms preprocess, 42.8ms inference, 12.8ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 34.9ms
Speed: 3.9ms preprocess, 34.9ms inference, 5.2ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 36.0ms


5
5


Speed: 3.7ms preprocess, 36.0ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 45.0ms
Speed: 5.0ms preprocess, 45.0ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 43.0ms
Speed: 0.0ms preprocess, 43.0ms inference, 9.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 35.2ms
Speed: 3.7ms preprocess, 35.2ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 35.1ms
Speed: 3.7ms preprocess, 35.1ms inference, 6.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 35.6ms
Speed: 4.3ms preprocess, 35.6ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 37.5ms
Speed: 5.0ms preprocess, 37.5ms inference, 16.3ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 book, 46.9ms
Speed: 5.1ms preprocess, 46.9ms inference, 1.1ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 39.6ms
Speed: 14.8ms preprocess, 39.6ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 44.9ms
Speed: 0.0ms preprocess, 44.9ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 1 laptop, 28.8ms
Speed: 0.0ms preprocess, 28.8ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 chairs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cup, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 2 toothbrushs, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 laptop, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 laptop, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 chair, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 toothbrushs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 toothbrushs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 2 cell phones, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 cell phones, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 2 cell phones, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 2 cell phones, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 laptop, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 mouse, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 1 mouse, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 chairs, 1 remote, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5
5



0: 384x640 1 person, 1 baseball bat, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cup, 1 laptop, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 cup, 1 chair, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 15.7ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 laptop, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 laptop, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5
5



0: 384x640 1 person, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 toothbrushs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 2 toothbrushs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 remote, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 remote, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 1 person, 1 chair, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 1 cell phone, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 baseball bat, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 1 book, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 2 cell phones, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 cup, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 cup, 1 cell phone, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 1 cell phone, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 1 tv, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 cup, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 remote, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 4 persons, 2 remotes, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 4 persons, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 3 persons, 1 remote, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 remote, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 4 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 remote, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 remote, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 toothbrush, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 3 persons, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 remote, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 toothbrush, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 toothbrush, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 2 persons, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 tv, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 3 persons, 1 tv, 1 laptop, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 3 persons, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 2 persons, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)


5
5



0: 384x640 1 person, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 tv, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.2ms


5
5


Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 15.6ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 2 chairs, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cup, 2 tvs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 2 tvs, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 cup, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms


5
5


Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 31.3ms
Speed: 0.0ms preprocess, 31.3ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 31.2ms
Speed: 0.0ms preprocess, 31.2ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 tv, 40.1ms
Speed: 0.0ms preprocess, 40.1ms inference, 4.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 tv, 35.7ms
Speed: 4.0ms preprocess, 35.7ms inference, 8.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 33.8ms
Speed: 8.8ms preprocess, 33.8ms inference, 0.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 35.4ms
Speed: 4.3ms preprocess, 35.4ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 1 cell phone, 41.8ms
Speed: 5.6ms preprocess, 41.8ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 39.0ms
Speed: 4.0ms preprocess, 39.0ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 37.7ms
Speed: 4.6ms preprocess, 37.7ms inference, 6.6ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 1 cell phone, 34.5ms
Speed: 6.6ms preprocess, 34.5ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 37.0ms
Speed: 6.3ms preprocess, 37.0ms inference, 10.5ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 42.0ms
Speed: 5.0ms preprocess, 42.0ms inference, 6.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 1 chair, 37.1ms
Speed: 6.0ms preprocess, 37.1ms inference, 10.0ms postprocess per image at shape (1, 3, 384, 640)

0: 384x640 1 person, 1 chair, 43.0ms
Speed: 6.1ms preprocess, 43.0ms inference, 5.0ms postprocess per image at shape (1, 3, 384, 640)



5
5


0: 384x640 1 person, 38.2ms
Speed: 4.2ms preprocess, 38.2ms inference, 6.4ms postprocess per image at shape (1, 3, 384, 640)


5


KeyboardInterrupt: 