In [1]:
import torch
import torchvision
from torchvision.models.detection import FasterRCNN, fasterrcnn_mobilenet_v3_large_fpn, fasterrcnn_resnet50_fpn_v2
from ultralytics import YOLO
from PIL import Image

In [2]:
from utils import run_validation, RCNN_YOLO, get_model_size

In [3]:
# Registry of detectors to benchmark, keyed by the label passed to the
# reporting helpers (`get_model_size`, `run_validation`).
#
# The torchvision Faster R-CNN models are wrapped in RCNN_YOLO (from utils);
# the Ultralytics models are loaded by name. Everything starts on the CPU, so
# only the model currently being validated has to be moved to an accelerator.
#
# `weights='COCO_V1'` replaces the deprecated `pretrained=True` flag. It is the
# checkpoint that `pretrained=True` resolves to for both builders, so the loaded
# parameters are unchanged while the deprecation warning goes away and the
# checkpoint stays pinned even if torchvision's DEFAULT alias moves later.
models = {
    'mobilenet_v3_large_fpn': RCNN_YOLO(fasterrcnn_mobilenet_v3_large_fpn(weights='COCO_V1').to('cpu')),
    'resnet50_v2_fpn': RCNN_YOLO(fasterrcnn_resnet50_fpn_v2(weights='COCO_V1').to('cpu')),
    'yolov10s_small': YOLO('yolov10s'),
    'yolov11n_nano': YOLO('yolo11n'),
    'yolov11s_small': YOLO('yolo11s'),
    'yolov11m_medium': YOLO('yolo11m')
}



In [4]:
# Validate every registered model in turn, keeping only the model under test
# on the accelerator.
#
# Use the GPU when one is present and fall back to the CPU otherwise, so the
# cell still runs on CPU-only machines instead of failing in `.to('cuda')`.
val_device = 'cuda' if torch.cuda.is_available() else 'cpu'

for name, model in models.items():
    # RCNN_YOLO is tested before YOLO, preserving the original dispatch order
    # (this matters if RCNN_YOLO derives from YOLO, which is not visible here).
    if isinstance(model, RCNN_YOLO):
        get_model_size(model, name=name)
        model.model.model = model.model.model.to(val_device)
    elif isinstance(model, YOLO):
        get_model_size(model, name=name)
        model.model = model.model.to(val_device)

    print(f'Running validation for {name}')
    try:
        run_validation(model, name=name, yaml_path='data.yaml')
    finally:
        # Move the weights back to the CPU even when validation raises, so a
        # failed run does not leave this model resident on the GPU while the
        # kernel stays alive.
        # NOTE(review): these calls pass the inner module and no `name`, unlike
        # the calls before validation; kept as-is, confirm that is intentional.
        if isinstance(model, RCNN_YOLO):
            get_model_size(model.model.model)
            model.model.model = model.model.model.to('cpu')
        elif isinstance(model, YOLO):
            get_model_size(model.model)
            model.model = model.model.to('cpu')

        # `.to('cpu')` only drops the tensors; the freed blocks stay in
        # PyTorch's caching allocator until they are released explicitly.
        if val_device == 'cuda':
            torch.cuda.empty_cache()

    print('')

------------------------------
Model name: mobilenet_v3_large_fpn
Model size: 74 MB
Number of parameters: 19.4 million
------------------------------

Running validation for mobilenet_v3_large_fpn
------------------------------
Running validation...
Model: mobilenet_v3_large_fpn
Ultralytics 8.3.34  Python-3.11.10 torch-2.4.1 CUDA:0 (NVIDIA GeForce RTX 3070, 8191MiB)


[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [02:20<00:00, 35.60it/s]


                   all       5000      36335      0.647      0.472      0.532      0.339
                person       2693      10777      0.727      0.644      0.707      0.441
               bicycle        149        314      0.649      0.401      0.476      0.239
                   car        535       1918      0.651      0.472      0.528      0.288
            motorcycle        159        367      0.735      0.569      0.666       0.38
              airplane         97        143      0.771      0.769      0.818      0.573
                   bus        189        283      0.776      0.686       0.76      0.599
                 train        157        190      0.798       0.75      0.849       0.63
                 truck        250        414       0.63      0.379      0.486      0.288
                  boat        121        424      0.556      0.417      0.417      0.187
         traffic light        191        634      0.602      0.338      0.377      0.159
          fire hydran

[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [06:15<00:00, 13.32it/s]


                   all       5000      36335      0.703      0.615      0.677      0.481
                person       2693      10777       0.78      0.778      0.842      0.604
               bicycle        149        314      0.721       0.56      0.638      0.388
                   car        535       1918      0.737      0.694      0.759       0.51
            motorcycle        159        367      0.798       0.72      0.805      0.508
              airplane         97        143      0.781      0.874      0.901       0.72
                   bus        189        283      0.863      0.795      0.873      0.725
                 train        157        190      0.839      0.847      0.892      0.707
                 truck        250        414       0.73      0.464      0.639      0.436
                  boat        121        424      0.602      0.587      0.606      0.316
         traffic light        191        634      0.682       0.56      0.621      0.338
          fire hydran

[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [01:31<00:00, 54.61it/s]


                   all       5000      36335      0.697      0.566      0.625      0.461
                person       2693      10777      0.819        0.7        0.8      0.577
               bicycle        149        314      0.744      0.487      0.578      0.352
                   car        535       1918      0.715      0.576      0.661      0.447
            motorcycle        159        367      0.777      0.657      0.751        0.5
              airplane         97        143      0.786      0.846      0.895      0.736
                   bus        189        283      0.871      0.763      0.829       0.71
                 train        157        190      0.878      0.837      0.902      0.746
                 truck        250        414      0.598      0.468      0.546      0.383
                  boat        121        424      0.736      0.421      0.515      0.289
         traffic light        191        634      0.686       0.41      0.506      0.272
          fire hydran

[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [01:29<00:00, 55.68it/s]


                   all       5000      36335      0.652      0.505      0.548      0.392
                person       2693      10777      0.759      0.676      0.753      0.523
               bicycle        149        314      0.686      0.404      0.478      0.275
                   car        535       1918      0.658      0.531      0.583      0.375
            motorcycle        159        367      0.765      0.605      0.679      0.446
              airplane         97        143        0.8      0.797      0.866      0.688
                   bus        189        283      0.769      0.707      0.774       0.65
                 train        157        190      0.832      0.811      0.863      0.681
                 truck        250        414      0.588      0.417      0.478      0.323
                  boat        121        424      0.583      0.354      0.414       0.22
         traffic light        191        634      0.645      0.347      0.416      0.218
          fire hydran

[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [01:29<00:00, 55.69it/s]


                   all       5000      36335      0.705      0.577      0.634      0.467
                person       2693      10777      0.809      0.721      0.807      0.585
               bicycle        149        314      0.736      0.478      0.569      0.345
                   car        535       1918      0.732      0.593      0.677      0.457
            motorcycle        159        367      0.785      0.665      0.752      0.499
              airplane         97        143      0.869      0.879      0.931      0.757
                   bus        189        283      0.844       0.77      0.857       0.73
                 train        157        190      0.872      0.861      0.934      0.764
                 truck        250        414      0.624      0.502       0.58      0.413
                  boat        121        424      0.684      0.419      0.518      0.302
         traffic light        191        634      0.687      0.426      0.498      0.267
          fire hydran

[34m[1mval: [0mScanning C:\Users\AbduM\Documents\VSCode\DS473-CV-Workspace\project\datasets\labels\val2017.cache... 4952 images, 48 backgrounds, 0 corrupt: 100%|██████████| 5000/5000 [00:00<?, ?it/s]
                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100%|██████████| 5000/5000 [01:39<00:00, 50.40it/s]


                   all       5000      36335      0.741      0.615      0.681      0.514
                person       2693      10777      0.837      0.746      0.841       0.63
               bicycle        149        314      0.781      0.545      0.654      0.418
                   car        535       1918      0.779      0.654      0.738      0.517
            motorcycle        159        367      0.785      0.711      0.795       0.55
              airplane         97        143      0.904      0.867      0.927      0.793
                   bus        189        283      0.849      0.814      0.888       0.77
                 train        157        190      0.891      0.879      0.938       0.76
                 truck        250        414       0.65      0.529      0.619      0.461
                  boat        121        424      0.728      0.495      0.593      0.354
         traffic light        191        634       0.73      0.451      0.557      0.312
          fire hydran