In [None]:
import torch
import torchvision.transforms.v2 as transforms
from data.data_loader import PascalVOCDataLoader, MSCocoDataLoader
from training.encoder import CenternetEncoder
from utils.config import IMG_HEIGHT, IMG_WIDTH
import matplotlib.pyplot as plt


# Report whether PyTorch can see a CUDA device. The label carries no trailing
# space because print() already inserts a single space between its arguments.
print("GPU is available:", torch.cuda.is_available())

In [None]:
# Preprocessing pipeline handed to the dataset loaders below:
#   1. resize every image to the configured input size,
#   2. convert it to a torchvision image tensor,
#   3. cast to float32 with value rescaling enabled (scale=True).
transform = transforms.Compose(
    [
        # torchvision's Resize expects `size` as (height, width); passing
        # (width, height) would transpose the target shape whenever
        # IMG_HEIGHT != IMG_WIDTH and disagree with the encoder below.
        transforms.Resize(size=(IMG_HEIGHT, IMG_WIDTH)),
        transforms.ToImage(),
        transforms.ToDtype(torch.float32, scale=True),
    ]
)
# Encoder passed to the Pascal VOC dataset loader; constructed with the same
# (IMG_HEIGHT, IMG_WIDTH) order as the resize target above.
voc_encoder = CenternetEncoder(IMG_HEIGHT, IMG_WIDTH)

In [3]:
# Point the Pascal VOC loader at the relative ../VOC directory, image_set "val".
voc_dataset_loader = PascalVOCDataLoader(
    image_set="val",
    dataset_path="../VOC",
)
# load() receives the shared preprocessing pipeline and the VOC encoder.
voc_dataset = voc_dataset_loader.load(transform, voc_encoder)

In [4]:
# Only `voc_batch_ds[0]` is read later in this notebook, so pull a single batch
# from the loader instead of materialising every batch of the split with
# list(DataLoader(...)), which keeps all decoded images in memory at once.
# The result is kept as a one-element list so `voc_batch_ds[0]` still works.
voc_loader = torch.utils.data.DataLoader(
    voc_dataset, num_workers=4, batch_size=32, shuffle=True
)
voc_batch_ds = [next(iter(voc_loader))]

In [None]:
# Sanity check: unpack the first VOC batch and display its first image.
imgs, lbls = voc_batch_ds[0]
fig, ax = plt.subplots()
# detach()/cpu() replace the legacy `.data` accessor before converting to NumPy.
# permute(1, 2, 0) moves axis 0 last for matplotlib
# (assumes the image tensor is channel-first, i.e. (C, H, W) — TODO confirm).
ax.imshow(imgs[0].detach().cpu().permute(1, 2, 0).numpy())
ax.set_title("Pascal VOC (val): first image of the batch")
# Trailing semicolon keeps the return value's repr out of the cell output.
ax.axis("off");

In [None]:
# Class count handed to the COCO encoder, lifted out of the call so it is easy to spot.
# NOTE(review): presumably sized to cover COCO's raw category ids — confirm
# against what CenternetEncoder and MSCocoDataLoader expect.
COCO_N_CLASSES = 90
coco_encoder = CenternetEncoder(
    IMG_HEIGHT,
    IMG_WIDTH,
    n_classes=COCO_N_CLASSES,
)

In [None]:
# Point the MS COCO loader at the relative ../COCO directory, image_set "val".
coco_dataset_loader = MSCocoDataLoader(
    image_set="val",
    dataset_path="../COCO",
)
# load() receives the shared preprocessing pipeline and the COCO encoder.
coco_dataset = coco_dataset_loader.load(transform, coco_encoder)

In [8]:
# Only `coco_batch_ds[0]` is read later in this notebook, so pull a single batch
# from the loader instead of materialising every batch of the split with
# list(DataLoader(...)), which keeps all decoded images in memory at once.
# The result is kept as a one-element list so `coco_batch_ds[0]` still works.
coco_loader = torch.utils.data.DataLoader(
    coco_dataset, num_workers=4, batch_size=32, shuffle=True
)
coco_batch_ds = [next(iter(coco_loader))]

In [None]:
# Sanity check: unpack the first COCO batch and display its first image.
imgs, lbls = coco_batch_ds[0]
fig, ax = plt.subplots()
# detach()/cpu() replace the legacy `.data` accessor before converting to NumPy.
# permute(1, 2, 0) moves axis 0 last for matplotlib
# (assumes the image tensor is channel-first, i.e. (C, H, W) — TODO confirm).
ax.imshow(imgs[0].detach().cpu().permute(1, 2, 0).numpy())
ax.set_title("MS COCO (val): first image of the batch")
# Trailing semicolon keeps the return value's repr out of the cell output.
ax.axis("off");