In [1]:
import torch
from torchvision.models.detection import fasterrcnn_resnet50_fpn
from torchvision.transforms import functional as F
from torchvision.utils import draw_bounding_boxes
from torchvision import transforms
from PIL import Image, ImageDraw
import numpy as np

In [2]:
# Read the class names from coco.names: the file content, minus trailing
# newlines, split into one list entry per line
class_labels = []
with open("coco.names", "rt") as names_file:
    names_text = names_file.read().rstrip('\n')
    class_labels = names_text.split('\n')

# Build the pre-trained Faster R-CNN detector and switch it to evaluation mode.
# NOTE(review): newer torchvision releases reportedly deprecate `pretrained=`
# in favour of `weights=` — confirm against the installed version.
model = fasterrcnn_resnet50_fpn(pretrained=True).eval()
# Last expression of the cell, so the notebook prints the model structure
model



FasterRCNN(
  (transform): GeneralizedRCNNTransform(
      Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
      Resize(min_size=(800,), max_size=1333, mode='bilinear')
  )
  (backbone): BackboneWithFPN(
    (body): IntermediateLayerGetter(
      (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
      (bn1): FrozenBatchNorm2d(64, eps=0.0)
      (relu): ReLU(inplace=True)
      (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
      (layer1): Sequential(
        (0): Bottleneck(
          (conv1): Conv2d(64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (bn1): FrozenBatchNorm2d(64, eps=0.0)
          (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
          (bn2): FrozenBatchNorm2d(64, eps=0.0)
          (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (bn3): FrozenBatchNorm2d(256, eps=0.0)
          (relu): ReLU(

In [3]:
# Load the input image.
# The context manager closes the underlying file once convert() has produced
# an independent in-memory copy of the pixels.
# Converting to RGB guarantees exactly three channels: a JPEG may also be
# stored as grayscale or CMYK, while the detector's first convolution takes
# 3 input channels and the annotation cell draws with RGB colour names.
with Image.open("Bus_rides2.jpg") as source_file:
    image = source_file.convert("RGB")

In [4]:
# Turn the PIL image into a tensor and run the detector on it
transform = transforms.Compose([transforms.ToTensor()])
image_tensor = transform(image)
# unsqueeze(0) prepends a size-1 dimension, so the model is handed a batch
# that holds just this one image
input_image = image_tensor.unsqueeze(0)

# Inference only: gradient tracking is switched off for the forward pass
with torch.no_grad():
    prediction = model(input_image)

In [5]:
# Overlay the confident detections on the image (the image is modified in place)
draw = ImageDraw.Draw(image)
boxes = prediction[0]['boxes']
labels = prediction[0]['labels']
scores = prediction[0]['scores']

# Convert the tensors to plain Python values once, then walk them in lockstep
detections = zip(boxes.tolist(), labels.tolist(), scores.tolist())
for coords, class_id, confidence in detections:
    # Skip ids that have no entry in class_labels and anything not scoring above 0.5
    if class_id >= len(class_labels) or not confidence > 0.5:
        continue
    corners = [round(value, 2) for value in coords]
    # NOTE(review): the label id is used directly as an index into class_labels;
    # this presumes coco.names is ordered to match the model's label ids
    # (including any background / placeholder entries) — verify against the file.
    caption = f'{class_labels[class_id]} {round(confidence, 2)}'
    draw.rectangle(corners, outline='red', width=3)
    # The caption is anchored at the first two coordinates of the box
    draw.text((corners[0], corners[1]), caption, fill='white')

In [6]:
# Display the result inline.
# Ending the cell with the image itself lets the notebook render it in the
# cell output (and store it in the saved notebook). Image.show() instead
# launches an external viewer, which shows nothing on a remote or headless kernel.
image