In [None]:
from typing import Any, List
from ultralytics import YOLO
from inference import InferencePipeline
from inference.core.interfaces.stream.sinks import render_boxes
from inference.core.interfaces.camera.entities import VideoFrame
import torch
import numpy as np

class MyModel:
    """Wrap an Ultralytics YOLO model behind a per-batch ``infer`` callback.

    The instance loads the weights once at construction time and then turns
    batches of video frames into plain-Python prediction dictionaries.
    """

    def __init__(self, weights_path: str):
        """Load the YOLO model stored at ``weights_path``."""
        self._model = YOLO(weights_path)
        print("Modèle chargé avec succès")

    def infer(self, video_frames: List["VideoFrame"]) -> List[Any]:
        """Run the model on a batch of frames and return one dict per result.

        Args:
            video_frames: Frames to process; only their ``image`` attribute
                is read.

        Returns:
            A list with one dictionary per model result, each holding the
            keys ``'boxes'`` (from ``result.boxes.xyxy``), ``'scores'``
            (from ``result.boxes.conf``) and ``'class_indices'`` (from
            ``result.boxes.cls``), all converted with ``.tolist()``.
            A result without boxes yields three empty lists.

        NOTE(review): this dictionary layout is custom. Sinks such as
        ``render_boxes`` presumably expect Roboflow-style detection
        predictions -- confirm that boxes are actually drawn with it.
        """
        print('Video frames:', len(video_frames))

        # np.asarray does not copy when the frame image is already an ndarray.
        images = [np.asarray(frame.image) for frame in video_frames]

        # Do not hand an empty batch to the model; there is nothing to predict.
        results = self._model(images) if images else []

        predictions = [self._extract_prediction(result) for result in results]

        print("Predictions made:", predictions)
        return predictions

    @staticmethod
    def _extract_prediction(result: Any) -> dict:
        """Convert a single model result into a plain-Python dictionary."""
        boxes = result.boxes
        # Falsy covers both a missing (None) and an empty boxes container.
        if not boxes:
            return {'boxes': [], 'scores': [], 'class_indices': []}
        return {
            'boxes': boxes.xyxy.tolist(),
            'scores': boxes.conf.tolist(),
            'class_indices': boxes.cls.tolist(),
        }

# Build the model wrapper and wire it into an inference pipeline that reads
# frames from the webcam and passes each prediction to render_boxes.
my_model = MyModel("../shifumi_trained.pt")
pipeline = InferencePipeline.init_with_custom_logic(
    on_video_frame=my_model.infer,
    video_reference=0,  # Ensure this is the correct device ID for your webcam
    on_prediction=render_boxes,  # Function to run after each prediction
)

pipeline.start()
try:
    pipeline.join()
except KeyboardInterrupt:
    # join() blocks until the pipeline ends; on Ctrl-C / kernel interrupt,
    # explicitly ask the pipeline to stop and wait for it, so it is not
    # left running (and presumably holding the webcam) in the background.
    pipeline.terminate()
    pipeline.join()

Modèle chargé avec succès
Video frames: 1

0: 384x640 1 person, 488.5ms
Speed: 4.0ms preprocess, 488.5ms inference, 11.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[306.0096130371094, 175.88134765625, 997.1483154296875, 714.2239990234375]], 'scores': [0.9610979557037354], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 587.1ms
Speed: 1.7ms preprocess, 587.1ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.919921875, 174.76580810546875, 997.4454345703125, 712.3582153320312]], 'scores': [0.9583205580711365], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 505.1ms
Speed: 1.8ms preprocess, 505.1ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[312.42999267578125, 174.77056884765625, 998.7556762695312, 712.1517333984375]], 'scores': [0.9575957655906677], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 476.0ms
Speed: 1.8ms preprocess, 476.0ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.8658142089844, 174.11572265625, 998.7926025390625, 712.2420043945312]], 'scores': [0.9593728184700012], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 469.9ms
Speed: 1.7ms preprocess, 469.9ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.2392883300781, 173.839599609375, 996.840576171875, 712.6450805664062]], 'scores': [0.9593580961227417], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 457.1ms
Speed: 2.1ms preprocess, 457.1ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.1182861328125, 174.0789794921875, 991.9722900390625, 712.2272338867188]], 'scores': [0.959876537322998], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 466.0ms
Speed: 2.1ms preprocess, 466.0ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.00439453125, 177.16290283203125, 986.3372802734375, 712.3081665039062]], 'scores': [0.9589807987213135], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 459.2ms
Speed: 2.0ms preprocess, 459.2ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.7613525390625, 177.10992431640625, 987.0887451171875, 712.2349243164062]], 'scores': [0.9600796699523926], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 463.5ms
Speed: 1.8ms preprocess, 463.5ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.6685791015625, 180.672607421875, 984.397705078125, 712.7371826171875]], 'scores': [0.9568293690681458], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 470.7ms
Speed: 1.8ms preprocess, 470.7ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.1903076171875, 179.95947265625, 987.5538330078125, 712.234619140625]], 'scores': [0.9578403830528259], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 450.2ms
Speed: 1.7ms preprocess, 450.2ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[312.28289794921875, 180.7440185546875, 989.3611450195312, 711.6641845703125]], 'scores': [0.9608865976333618], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 459.1ms
Speed: 1.9ms preprocess, 459.1ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[312.7664794921875, 180.8076171875, 989.3802490234375, 711.6505737304688]], 'scores': [0.9589253664016724], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 460.8ms
Speed: 1.3ms preprocess, 460.8ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.990234375, 180.830078125, 988.646484375, 711.6004638671875]], 'scores': [0.9605384469032288], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 474.7ms
Speed: 2.4ms preprocess, 474.7ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.22698974609375, 180.58282470703125, 989.1594848632812, 711.68896484375], [101.37298583984375, 655.67138671875, 270.65411376953125, 719.048095703125]], 'scores': [0.9603418111801147, 0.2741149663925171], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 462.9ms
Speed: 1.8ms preprocess, 462.9ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.7830810546875, 181.30963134765625, 989.2357177734375, 711.8861694335938]], 'scores': [0.9605764150619507], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 461.1ms
Speed: 1.7ms preprocess, 461.1ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.24462890625, 181.3011474609375, 989.0787353515625, 711.748779296875], [99.04507446289062, 654.6950073242188, 270.46453857421875, 719.1561889648438]], 'scores': [0.9613088369369507, 0.2553267478942871], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 459.1ms
Speed: 2.0ms preprocess, 459.1ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.4512939453125, 181.36700439453125, 989.0791015625, 711.9288940429688], [101.46151733398438, 654.6685791015625, 270.64239501953125, 719.2545166015625]], 'scores': [0.9614150524139404, 0.28268009424209595], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 472.0ms
Speed: 1.7ms preprocess, 472.0ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.246826171875, 181.925048828125, 989.5458984375, 711.879150390625], [100.83212280273438, 655.2952880859375, 270.457275390625, 719.0045166015625]], 'scores': [0.9603214859962463, 0.2546190321445465], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 462.0ms
Speed: 1.8ms preprocess, 462.0ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.7054443359375, 182.4794921875, 990.6956787109375, 711.79736328125], [101.14447021484375, 654.8748168945312, 270.43524169921875, 719.1593627929688]], 'scores': [0.9615822434425354, 0.321582555770874], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 460.2ms
Speed: 2.4ms preprocess, 460.2ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.4345703125, 181.2064208984375, 990.22607421875, 711.5731811523438], [99.14004516601562, 653.88623046875, 270.22039794921875, 719.0347900390625]], 'scores': [0.9575160145759583, 0.25805309414863586], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 458.6ms
Speed: 1.5ms preprocess, 458.6ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[312.9346008300781, 181.97796630859375, 990.469482421875, 711.7099609375]], 'scores': [0.9601266980171204], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 465.8ms
Speed: 1.9ms preprocess, 465.8ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.44488525390625, 181.97332763671875, 989.3024291992188, 711.9839477539062]], 'scores': [0.95587557554245], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 457.1ms
Speed: 1.7ms preprocess, 457.1ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.2807312011719, 181.275634765625, 988.906982421875, 712.3692626953125]], 'scores': [0.9596673846244812], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 464.3ms
Speed: 1.8ms preprocess, 464.3ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.1727600097656, 181.6700439453125, 988.8057861328125, 712.6256103515625], [101.21271514892578, 654.53759765625, 270.66552734375, 719.113037109375]], 'scores': [0.9582110643386841, 0.3030565083026886], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 467.6ms
Speed: 1.5ms preprocess, 467.6ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.04779052734375, 181.5704345703125, 988.8672485351562, 712.8414306640625], [99.01937103271484, 654.4761962890625, 270.3973693847656, 718.9630126953125]], 'scores': [0.9595453143119812, 0.2919144928455353], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 468.8ms
Speed: 1.8ms preprocess, 468.8ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.7077941894531, 181.83575439453125, 989.29736328125, 712.4058227539062]], 'scores': [0.9560647010803223], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 454.5ms
Speed: 2.6ms preprocess, 454.5ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.10528564453125, 173.91790771484375, 988.4219360351562, 712.4647216796875], [100.92050170898438, 654.6000366210938, 270.5944519042969, 719.0004272460938]], 'scores': [0.9565380215644836, 0.25268229842185974], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 473.1ms
Speed: 1.8ms preprocess, 473.1ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.8229064941406, 172.9296875, 990.4278564453125, 712.284423828125], [101.00830078125, 654.434326171875, 270.6347351074219, 719.16796875]], 'scores': [0.9553146958351135, 0.2729247510433197], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 482.9ms
Speed: 1.6ms preprocess, 482.9ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[310.6728515625, 174.0367431640625, 991.685791015625, 712.4260864257812], [98.69525146484375, 654.307373046875, 270.2808532714844, 719.0927734375]], 'scores': [0.9561190605163574, 0.26654425263404846], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 465.9ms
Speed: 1.7ms preprocess, 465.9ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[309.8359375, 174.8828125, 992.659912109375, 712.78515625]], 'scores': [0.9559118151664734], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 473.2ms
Speed: 2.0ms preprocess, 473.2ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.96453857421875, 174.52630615234375, 992.3617553710938, 712.4212036132812], [100.89290618896484, 655.01708984375, 270.7674865722656, 719.20458984375]], 'scores': [0.9573076963424683, 0.3127821683883667], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 463.9ms
Speed: 2.1ms preprocess, 463.9ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.2521057128906, 175.59466552734375, 991.6151123046875, 712.617919921875]], 'scores': [0.9558194279670715], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 478.5ms
Speed: 2.1ms preprocess, 478.5ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.72735595703125, 176.05853271484375, 990.7122192382812, 712.5830688476562]], 'scores': [0.9581126570701599], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 546.4ms
Speed: 2.0ms preprocess, 546.4ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.918212890625, 176.9090576171875, 989.9376220703125, 712.7127685546875]], 'scores': [0.9587209820747375], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 517.4ms
Speed: 2.7ms preprocess, 517.4ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.9816589355469, 176.7601318359375, 989.569091796875, 712.537841796875], [101.17961883544922, 654.5431518554688, 270.70697021484375, 719.0830688476562]], 'scores': [0.9587094783782959, 0.26245006918907166], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 480.2ms
Speed: 1.6ms preprocess, 480.2ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.8452453613281, 176.99359130859375, 989.745361328125, 712.7664794921875], [100.7926025390625, 654.871826171875, 270.86029052734375, 719.067626953125]], 'scores': [0.9577887654304504, 0.2844209372997284], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 468.7ms
Speed: 2.2ms preprocess, 468.7ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.191650390625, 176.98687744140625, 990.3106689453125, 712.5900268554688], [101.0584716796875, 654.2332763671875, 270.89056396484375, 719.1849365234375]], 'scores': [0.9572760462760925, 0.2794729173183441], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 472.2ms
Speed: 1.6ms preprocess, 472.2ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[313.7710266113281, 176.943359375, 990.446533203125, 712.7822875976562], [101.2657470703125, 655.2548828125, 270.72344970703125, 719.072998046875]], 'scores': [0.9560852646827698, 0.2581758499145508], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 466.2ms
Speed: 2.1ms preprocess, 466.2ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.98248291015625, 176.7845458984375, 990.6054077148438, 712.93359375], [101.257568359375, 655.153076171875, 270.4220886230469, 719.083984375]], 'scores': [0.9574387073516846, 0.26740026473999023], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 465.3ms
Speed: 1.5ms preprocess, 465.3ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.2143249511719, 176.739013671875, 989.642822265625, 712.573486328125], [101.5699462890625, 654.6785278320312, 270.5197448730469, 719.1287231445312]], 'scores': [0.9534914493560791, 0.32427433133125305], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 482.1ms
Speed: 2.5ms preprocess, 482.1ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.5528869628906, 176.1510009765625, 988.3360595703125, 712.4520263671875]], 'scores': [0.9549574851989746], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 472.3ms
Speed: 2.1ms preprocess, 472.3ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.1693420410156, 176.2977294921875, 988.0435791015625, 712.531494140625]], 'scores': [0.9562198519706726], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 527.3ms
Speed: 1.4ms preprocess, 527.3ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.4900207519531, 176.19970703125, 987.013671875, 712.1905517578125], [101.12350463867188, 654.7845458984375, 270.5705261230469, 719.1136474609375]], 'scores': [0.9567689895629883, 0.28472664952278137], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 477.3ms
Speed: 2.3ms preprocess, 477.3ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.66790771484375, 176.7850341796875, 987.3972778320312, 712.27734375]], 'scores': [0.955862820148468], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 480.4ms
Speed: 2.4ms preprocess, 480.4ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.4889831542969, 177.269287109375, 988.344482421875, 712.56640625]], 'scores': [0.9568266272544861], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 469.2ms
Speed: 1.4ms preprocess, 469.2ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.46832275390625, 177.783935546875, 988.5059204101562, 712.6151123046875], [101.58184051513672, 654.84423828125, 270.9498291015625, 719.1868896484375]], 'scores': [0.9585406184196472, 0.29477083683013916], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 483.2ms
Speed: 2.4ms preprocess, 483.2ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.7720642089844, 178.395751953125, 989.9708251953125, 712.552978515625], [101.33226776123047, 655.159423828125, 270.54083251953125, 719.102783203125]], 'scores': [0.95371413230896, 0.3121180236339569], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 471.0ms
Speed: 2.4ms preprocess, 471.0ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[309.4234619140625, 178.953125, 990.40771484375, 712.4593505859375], [101.368896484375, 655.19873046875, 271.02154541015625, 719.2042236328125]], 'scores': [0.9563186168670654, 0.37383994460105896], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 469.6ms
Speed: 1.5ms preprocess, 469.6ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.1436767578125, 175.908203125, 991.69189453125, 712.14892578125]], 'scores': [0.9560105204582214], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 481.2ms
Speed: 2.2ms preprocess, 481.2ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[312.5103759765625, 176.3665771484375, 991.748291015625, 712.4005737304688]], 'scores': [0.9588909149169922], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 463.3ms
Speed: 2.0ms preprocess, 463.3ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[315.63037109375, 177.56396484375, 991.0518798828125, 712.3284912109375]], 'scores': [0.9592711925506592], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 467.4ms
Speed: 1.6ms preprocess, 467.4ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[300.30419921875, 180.315185546875, 1026.91845703125, 712.439453125]], 'scores': [0.9574718475341797], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 466.6ms
Speed: 1.9ms preprocess, 466.6ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[299.227294921875, 175.1053466796875, 983.7642822265625, 713.26025390625]], 'scores': [0.9541743993759155], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 468.3ms
Speed: 1.7ms preprocess, 468.3ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[282.758056640625, 181.005615234375, 976.3531494140625, 713.7062377929688]], 'scores': [0.957673966884613], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 461.2ms
Speed: 2.0ms preprocess, 461.2ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[307.0533447265625, 183.14013671875, 995.5059814453125, 713.578857421875]], 'scores': [0.9453357458114624], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 473.2ms
Speed: 1.9ms preprocess, 473.2ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[338.701416015625, 193.42718505859375, 1054.45361328125, 713.8762817382812]], 'scores': [0.944580078125], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 470.6ms
Speed: 1.8ms preprocess, 470.6ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[363.4510498046875, 204.46617126464844, 1039.108642578125, 711.8001708984375]], 'scores': [0.9533641338348389], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 479.1ms
Speed: 2.0ms preprocess, 479.1ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[359.9129638671875, 215.55126953125, 1084.4852294921875, 713.2247924804688]], 'scores': [0.9468186497688293], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 468.6ms
Speed: 2.1ms preprocess, 468.6ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[337.8186340332031, 213.429443359375, 1033.8486328125, 714.9857177734375]], 'scores': [0.9538756012916565], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 1 toothbrush, 471.6ms
Speed: 1.3ms preprocess, 471.6ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[296.0246887207031, 203.94740295410156, 1038.59814453125, 712.9737548828125], [654.1046142578125, 551.3095703125, 711.05078125, 637.252685546875], [101.94107055664062, 655.702880859375, 270.72320556640625, 719.1219482421875]], 'scores': [0.94134122133255, 0.5909106731414795, 0.26727718114852905], 'class_indices': [0.0, 79.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 474.3ms
Speed: 2.7ms preprocess, 474.3ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[267.4200439453125, 194.30560302734375, 1047.260986328125, 715.1731567382812]], 'scores': [0.9354923963546753], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 464.6ms
Speed: 2.1ms preprocess, 464.6ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[150.3760986328125, 193.75982666015625, 1049.975830078125, 714.6517333984375]], 'scores': [0.9464744925498962], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 473.3ms
Speed: 1.6ms preprocess, 473.3ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[330.8702392578125, 199.535400390625, 1053.3214111328125, 712.0963134765625]], 'scores': [0.9338381886482239], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 466.7ms
Speed: 1.7ms preprocess, 466.7ms inference, 0.9ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[359.6560363769531, 197.477783203125, 1034.649658203125, 712.634033203125]], 'scores': [0.9476251602172852], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 479.2ms
Speed: 2.1ms preprocess, 479.2ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[370.2364501953125, 196.733642578125, 1026.2945556640625, 712.9046630859375]], 'scores': [0.9548259377479553], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 472.5ms
Speed: 1.5ms preprocess, 472.5ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[368.9527587890625, 202.90545654296875, 1036.6126708984375, 713.91455078125], [101.72057342529297, 654.9841918945312, 270.5858154296875, 719.0919799804688]], 'scores': [0.9486579895019531, 0.2806280851364136], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 tie, 475.8ms
Speed: 1.6ms preprocess, 475.8ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[371.224609375, 205.3511962890625, 1034.62890625, 713.4791259765625], [573.1105346679688, 591.027587890625, 718.1388549804688, 719.188720703125]], 'scores': [0.9501128196716309, 0.40673309564590454], 'class_indices': [0.0, 27.0]}]
Video frames: 1



0: 384x640 1 person, 1 toothbrush, 473.6ms
Speed: 1.5ms preprocess, 473.6ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[366.071533203125, 203.45274353027344, 1035.8001708984375, 713.720947265625], [662.9935302734375, 597.4119873046875, 697.384033203125, 628.1895751953125]], 'scores': [0.9508256316184998, 0.2917153835296631], 'class_indices': [0.0, 79.0]}]
Video frames: 1



0: 384x640 1 person, 1 tie, 1 toilet, 469.2ms
Speed: 1.7ms preprocess, 469.2ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[368.170166015625, 203.9759979248047, 1035.837646484375, 713.5741577148438], [616.6148681640625, 609.177978515625, 672.78662109375, 719.27880859375], [102.09381103515625, 655.8355712890625, 270.5544738769531, 719.0555419921875]], 'scores': [0.9485750794410706, 0.6137323379516602, 0.29717788100242615], 'class_indices': [0.0, 27.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 468.3ms
Speed: 2.7ms preprocess, 468.3ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[350.9642333984375, 207.3763427734375, 1038.8111572265625, 714.0648193359375], [101.9268798828125, 656.0694580078125, 270.6813049316406, 719.1429443359375]], 'scores': [0.9454811215400696, 0.291523814201355], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 464.9ms
Speed: 1.7ms preprocess, 464.9ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[369.2891845703125, 208.38804626464844, 1038.960205078125, 713.3271484375], [101.8501205444336, 656.2150268554688, 270.4405822753906, 719.1454467773438]], 'scores': [0.9422521591186523, 0.2721845805644989], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 481.1ms
Speed: 1.7ms preprocess, 481.1ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[375.0541687011719, 210.01368713378906, 1035.5693359375, 712.7725830078125], [101.73617553710938, 655.6849365234375, 270.52947998046875, 719.1236572265625]], 'scores': [0.9509158730506897, 0.31188035011291504], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 463.8ms
Speed: 2.8ms preprocess, 463.8ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[350.9520263671875, 206.2298126220703, 1027.42626953125, 713.3078002929688]], 'scores': [0.9436962008476257], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 476.9ms
Speed: 2.3ms preprocess, 476.9ms inference, 0.9ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[388.5953674316406, 205.54615783691406, 1027.8175048828125, 711.540283203125]], 'scores': [0.9521703124046326], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 toilet, 474.8ms
Speed: 2.3ms preprocess, 474.8ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[289.6920166015625, 192.1253662109375, 1032.54638671875, 711.7808837890625], [101.53982543945312, 656.1036987304688, 270.6129150390625, 719.0531616210938]], 'scores': [0.9502249956130981, 0.2552475333213806], 'class_indices': [0.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 475.1ms
Speed: 1.6ms preprocess, 475.1ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[125.0347900390625, 144.9036865234375, 1081.9588623046875, 711.05029296875]], 'scores': [0.9601716995239258], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 485.5ms
Speed: 1.9ms preprocess, 485.5ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[125.80801391601562, 148.6881103515625, 1108.3724365234375, 711.374755859375]], 'scores': [0.9501961469650269], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 477.0ms
Speed: 1.5ms preprocess, 477.0ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[244.0419921875, 164.3515625, 1034.343017578125, 711.3367919921875]], 'scores': [0.9512777924537659], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 475.1ms
Speed: 1.9ms preprocess, 475.1ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[128.662353515625, 155.6783447265625, 1230.9130859375, 710.5494384765625]], 'scores': [0.9503864645957947], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 485.3ms
Speed: 1.5ms preprocess, 485.3ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[115.001708984375, 158.3494873046875, 1265.650390625, 711.5159912109375]], 'scores': [0.9585179686546326], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 474.4ms
Speed: 2.2ms preprocess, 474.4ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[142.731201171875, 166.46722412109375, 1279.1246337890625, 710.9976196289062]], 'scores': [0.9604747891426086], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 472.0ms
Speed: 1.5ms preprocess, 472.0ms inference, 0.9ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[149.76513671875, 165.52215576171875, 1278.67431640625, 710.8532104492188]], 'scores': [0.9618844985961914], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 475.2ms
Speed: 2.0ms preprocess, 475.2ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[134.847412109375, 163.92144775390625, 1279.723388671875, 711.0905151367188]], 'scores': [0.949631929397583], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 498.5ms
Speed: 1.3ms preprocess, 498.5ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[337.134521484375, 163.65728759765625, 1261.823974609375, 711.7301025390625]], 'scores': [0.9549861550331116], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 baseball bat, 1 toilet, 474.6ms
Speed: 1.9ms preprocess, 474.6ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[330.0057373046875, 161.49224853515625, 1260.488525390625, 711.2322387695312], [916.5543823242188, 2.37896728515625, 969.6167602539062, 543.9479370117188], [101.23306274414062, 656.5675048828125, 270.4012451171875, 719.2781982421875]], 'scores': [0.9635104537010193, 0.38599008321762085, 0.28031617403030396], 'class_indices': [0.0, 34.0, 61.0]}]
Video frames: 1



0: 384x640 1 person, 1 baseball bat, 483.9ms
Speed: 1.8ms preprocess, 483.9ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[324.208984375, 156.76611328125, 1247.515625, 711.0990600585938], [916.1152954101562, 2.36883544921875, 961.7543334960938, 541.2762451171875]], 'scores': [0.9614242315292358, 0.3883731961250305], 'class_indices': [0.0, 34.0]}]
Video frames: 1



0: 384x640 1 person, 744.4ms
Speed: 2.6ms preprocess, 744.4ms inference, 0.9ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[323.2784423828125, 150.28515625, 1226.8360595703125, 711.745849609375]], 'scores': [0.9628911018371582], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 524.0ms
Speed: 2.7ms preprocess, 524.0ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[325.3815612792969, 147.7576904296875, 1211.31787109375, 711.6181030273438], [764.7601318359375, 309.7203369140625, 877.6492919921875, 579.0777587890625]], 'scores': [0.9630725979804993, 0.5111086368560791], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 483.8ms
Speed: 2.1ms preprocess, 483.8ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[324.97216796875, 150.10125732421875, 1198.378173828125, 711.3168334960938], [775.152587890625, 222.6572265625, 876.9091796875, 480.67108154296875]], 'scores': [0.962877631187439, 0.3132375478744507], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 525.2ms
Speed: 1.8ms preprocess, 525.2ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[325.9954528808594, 151.527099609375, 1191.8856201171875, 711.3670043945312], [778.80517578125, 312.930908203125, 872.2760009765625, 478.4478759765625]], 'scores': [0.9660178422927856, 0.4881247878074646], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 519.0ms
Speed: 1.9ms preprocess, 519.0ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[327.3656921386719, 151.46044921875, 1190.51904296875, 711.3143310546875], [781.668212890625, 312.3155517578125, 872.589111328125, 478.26513671875]], 'scores': [0.9655749201774597, 0.5195655226707458], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 474.8ms
Speed: 2.6ms preprocess, 474.8ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[326.1950988769531, 152.6253662109375, 1191.52001953125, 711.342529296875], [781.4532470703125, 313.3726806640625, 873.550048828125, 475.1702880859375]], 'scores': [0.966218113899231, 0.4963241219520569], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 1 cell phone, 469.9ms
Speed: 2.7ms preprocess, 469.9ms inference, 0.4ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[324.4652099609375, 154.34228515625, 1196.2762451171875, 711.2394409179688], [782.4053344726562, 312.7023620605469, 875.4684448242188, 481.0865173339844]], 'scores': [0.9660285115242004, 0.5987857580184937], 'class_indices': [0.0, 67.0]}]
Video frames: 1



0: 384x640 1 person, 467.1ms
Speed: 1.2ms preprocess, 467.1ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[320.8291320800781, 159.767333984375, 1027.154541015625, 712.7158203125]], 'scores': [0.9553879499435425], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 473.0ms
Speed: 2.1ms preprocess, 473.0ms inference, 0.3ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[302.42633056640625, 174.75714111328125, 994.6156616210938, 711.2979736328125]], 'scores': [0.9522188305854797], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 509.8ms
Speed: 1.3ms preprocess, 509.8ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[299.7882385253906, 180.1060791015625, 975.9910888671875, 711.759521484375]], 'scores': [0.956748366355896], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 537.5ms
Speed: 2.0ms preprocess, 537.5ms inference, 0.8ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[311.6809997558594, 174.616455078125, 992.3162841796875, 711.430908203125]], 'scores': [0.9573934674263], 'class_indices': [0.0]}]
Video frames: 1



0: 384x640 1 person, 508.2ms
Speed: 1.9ms preprocess, 508.2ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[314.4383544921875, 173.0677490234375, 992.905029296875, 711.6725463867188]], 'scores': [0.9584246873855591], 'class_indices': [0.0]}]
Video frames: 1



KeyboardInterrupt: 

0: 384x640 1 person, 689.4ms
Speed: 2.2ms preprocess, 689.4ms inference, 0.7ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.673828125, 172.3680419921875, 993.9781494140625, 711.6966552734375]], 'scores': [0.9577639102935791], 'class_indices': [0.0]}]
Video frames: 1

0: 384x640 1 person, 504.7ms
Speed: 2.3ms preprocess, 504.7ms inference, 0.6ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[316.6331787109375, 172.14727783203125, 994.423583984375, 711.9906005859375]], 'scores': [0.9573447704315186], 'class_indices': [0.0]}]
Video frames: 1

0: 384x640 1 person, 1 toilet, 511.3ms
Speed: 1.8ms preprocess, 511.3ms inference, 0.5ms postprocess per image at shape (1, 3, 384, 640)
Predictions made: [{'boxes': [[317.3801574707031, 173.082763671875, 994.798095703125, 711.7730712890625], [101.35464477539062, 656.1139526367188, 270.4997253417969, 719.1968383789062]], 'scores': [0.9560822248458862, 0.26452329754829407], 'class_i