In [1]:
# Copyright (c) OpenMMLab. All rights reserved.
import numpy as np
import torch
import warnings
warnings.filterwarnings('ignore')
from mmcv import ConfigDict

from mmdet.models.dense_heads import CenterNetHead

In [7]:
def test_center_head_loss():
    """Check the CenterNetHead losses for empty and non-empty ground truth.

    A head is run once on a random ``(1, 64, s, s)`` feature map and the
    resulting outputs are passed to ``loss`` twice:

    * with no ground-truth boxes, where the centre-heatmap loss must be
      positive while the width/height and offset losses must be exactly 0;
    * with a single ground-truth box, where all three losses must be
      positive.

    The shapes of the feature map, the head outputs and the empty ground
    truth, as well as the three empty-ground-truth losses, are printed.

    Raises:
        AssertionError: If any of the loss expectations above is violated.
    """
    s = 256
    img_metas = [{
        'img_shape': (s, s, 3),
        'scale_factor': 1,
        'pad_shape': (s, s, 3)
    }]
    # Spelled ``topk`` (not ``topK``) so the key agrees with the config used
    # by test_centernet_head_get_bboxes; the loss path does not read it.
    test_cfg = dict(topk=100, max_per_img=100)
    # Named ``head`` rather than ``self``: this is a free function, not a
    # method, so ``self`` would be misleading.
    head = CenterNetHead(
        num_classes=80, in_channel=64, feat_channel=64, test_cfg=test_cfg)

    feat = [torch.rand(1, 64, s, s)]
    center_out, wh_out, offset_out = head.forward(feat)
    print('feat:', feat[0].shape)
    print('center_out:', center_out[0].shape)
    print('wh_out:', wh_out[0].shape)
    print('offset_out:', offset_out[0].shape)

    # Test that empty ground truth encourages the network to predict
    # background.
    gt_bboxes = [torch.empty((0, 4))]
    print(gt_bboxes)
    print('gt_bboxes:', gt_bboxes[0].shape)
    gt_labels = [torch.LongTensor([])]
    print(gt_labels)
    print('gt_labels:', gt_labels[0].shape)

    gt_bboxes_ignore = None
    empty_gt_losses = head.loss(center_out, wh_out, offset_out, gt_bboxes,
                                gt_labels, img_metas, gt_bboxes_ignore)
    loss_center = empty_gt_losses['loss_center_heatmap']
    loss_wh = empty_gt_losses['loss_wh']
    loss_offset = empty_gt_losses['loss_offset']
    print(loss_center)
    print(loss_wh)
    print(loss_offset)
    assert loss_center.item() > 0, 'loss_center should be non-zero'
    assert loss_wh.item() == 0, (
        'there should be no loss_wh when there are no true boxes')
    assert loss_offset.item() == 0, (
        'there should be no loss_offset when there are no true boxes')

    # When truth is non-empty then both cls and box loss should be nonzero
    # for random inputs.
    gt_bboxes = [
        torch.Tensor([[23.6667, 23.8757, 238.6326, 151.8874]]),
    ]
    gt_labels = [torch.LongTensor([2])]
    one_gt_losses = head.loss(center_out, wh_out, offset_out, gt_bboxes,
                              gt_labels, img_metas, gt_bboxes_ignore)
    loss_center = one_gt_losses['loss_center_heatmap']
    loss_wh = one_gt_losses['loss_wh']
    loss_offset = one_gt_losses['loss_offset']
    assert loss_center.item() > 0, 'loss_center should be non-zero'
    assert loss_wh.item() > 0, 'loss_wh should be non-zero'
    assert loss_offset.item() > 0, 'loss_offset should be non-zero'

In [8]:
# Run the loss test: it prints the tensor shapes and the three
# empty-ground-truth losses, and raises AssertionError on a failed check.
test_center_head_loss()

feat: torch.Size([1, 64, 256, 256])
center_out: torch.Size([1, 80, 256, 256])
wh_out: torch.Size([1, 2, 256, 256])
offset_out: torch.Size([1, 2, 256, 256])
[tensor([], size=(0, 4))]
gt_bboxes: torch.Size([0, 4])
[tensor([], dtype=torch.int64)]
gt_labels: torch.Size([0])
tensor(899615.6250, grad_fn=<MulBackward0>)
tensor(0., grad_fn=<MulBackward0>)
tensor(0., grad_fn=<MulBackward0>)


In [None]:
def test_centernet_head_get_bboxes():
    """Tests center head generating and decoding the heatmap.

    Two things are verified for one image with three ground-truth boxes:

    1. ``get_targets`` puts a heatmap value of 1 at each box's truncated
       centre (on the ``s // 4`` grid, in the channel of the box's label)
       and stores the box width/height and the fractional centre offset at
       that same location.
    2. ``get_bboxes``, fed those targets in place of predictions, returns
       detections whose first three boxes each coincide exactly with one of
       the ground-truth boxes.

    Raises:
        AssertionError: If a target value or a decoded box is not as
            expected.
    """
    s = 256
    img_metas = [{
        'img_shape': (s, s, 3),
        'scale_factor': np.array([1., 1., 1., 1.]),
        'pad_shape': (s, s, 3),
        'batch_input_shape': (s, s),
        'border': (0, 0, 0, 0),
        'flip': False
    }]
    test_cfg = ConfigDict(
        dict(topk=100, local_maximum_kernel=3, max_per_img=100))
    gt_bboxes = [
        torch.Tensor([[10, 20, 200, 240], [40, 50, 100, 200],
                      [10, 20, 100, 240]])
    ]
    gt_labels = [torch.LongTensor([1, 1, 2])]

    # Named ``head`` rather than ``self``: this is a free function.
    head = CenterNetHead(
        num_classes=4, in_channel=1, feat_channel=4, test_cfg=test_cfg)
    head.feat_shape = (1, 1, s // 4, s // 4)
    targets, _ = head.get_targets(gt_bboxes, gt_labels, head.feat_shape,
                                  img_metas[0]['pad_shape'])
    center_target = targets['center_heatmap_target']
    wh_target = targets['wh_target']
    offset_target = targets['offset_target']

    # Make sure the targets are assigned correctly. The target maps are
    # s // 4 wide and high, so boxes are scaled by 1/4 before comparison.
    for gt_bbox, label in zip(gt_bboxes[0], gt_labels[0]):
        bbox = gt_bbox / 4  # bbox format [tl_x, tl_y, br_x, br_y]
        # ctx = (tl_x + br_x) / 2, cty = (tl_y + br_y) / 2
        ctx, cty = sum(bbox[0::2]) / 2, sum(bbox[1::2]) / 2
        # Truncated centre: the cell that holds this box's targets.
        int_ctx, int_cty = int(ctx), int(cty)
        w, h = bbox[2] - bbox[0], bbox[3] - bbox[1]  # br - tl
        # Fractional part of the centre that truncation discards.
        x_off = ctx - int_ctx
        y_off = cty - int_cty
        # center_target is indexed as (B, num_classes, H, W).
        assert center_target[0, label, int_cty, int_ctx] == 1
        # wh_target and offset_target are indexed as (B, 2, H, W).
        assert wh_target[0, 0, int_cty, int_ctx] == w
        assert wh_target[0, 1, int_cty, int_ctx] == h
        assert offset_target[0, 0, int_cty, int_ctx] == x_off
        assert offset_target[0, 1, int_cty, int_ctx] == y_off

    # Make sure get_bboxes is right: decode the targets themselves.
    detections = head.get_bboxes([center_target], [wh_target], [offset_target],
                                 img_metas,
                                 rescale=True,
                                 with_nms=False)
    # list[tuple[Tensor, Tensor]]: each item in the result list is a 2-tuple.
    # The first item is an (n, 5) tensor, where 5 represents
    # (tl_x, tl_y, br_x, br_y, score) and the score is between 0 and 1.
    # The second tensor has shape (n,), and each element is the class label
    # of the corresponding box.
    out_bboxes = detections[0][0][:3]  # torch.Size([3, 5])
    # NOTE: only box coordinates are compared; the labels in
    # detections[0][1] are not checked by this test.
    for bbox in out_bboxes:
        # A decoded box passes if all four coordinates equal those of at
        # least one ground-truth box.
        assert any((bbox[:4] == gt_bbox[:4]).all()
                   for gt_bbox in gt_bboxes[0]), 'get_bboxes is wrong'

In [129]:
# Run the target-assignment / decoding test; it prints nothing and raises
# AssertionError if any check fails.
test_centernet_head_get_bboxes()

In [2]:
# Scratch copy of the setup from test_centernet_head_get_bboxes, run at top
# level so the intermediate values can be inspected in the cells below.
s = 256

# Meta information for the single s x s test image.
img_metas = [
    dict(
        img_shape=(s, s, 3),
        scale_factor=np.array([1., 1., 1., 1.]),
        pad_shape=(s, s, 3),
        batch_input_shape=(s, s),
        border=(0, 0, 0, 0),
        flip=False,
    )
]
test_cfg = ConfigDict({
    'topk': 100,
    'local_maximum_kernel': 3,
    'max_per_img': 100,
})

# Three ground-truth boxes, one row each as [tl_x, tl_y, br_x, br_y], and
# their class labels.
gt_bboxes = [
    torch.Tensor([
        [10, 20, 200, 240],
        [40, 50, 100, 200],
        [10, 20, 100, 240],
    ])
]
gt_labels = [torch.LongTensor([1, 1, 2])]

# NOTE: ``self`` is an ordinary global here; later cells refer to it by
# this name.
self = CenterNetHead(
    num_classes=4, in_channel=1, feat_channel=4, test_cfg=test_cfg)
self.feat_shape = (1, 1, s // 4, s // 4)
targets, _ = self.get_targets(
    gt_bboxes, gt_labels, self.feat_shape, img_metas[0]['pad_shape'])

# Pull the three target maps out of the returned dict.
center_target, wh_target, offset_target = (
    targets[key]
    for key in ('center_heatmap_target', 'wh_target', 'offset_target'))

In [1]:
import torch

In [2]:
# Ground-truth boxes for a single image: one row per box.
gt_bboxes = [
    torch.Tensor([
        [10, 20, 200, 240],
        [40, 50, 100, 200],
        [10, 20, 100, 240],
    ])
]

In [5]:
# Number of ground-truth boxes in the first (and only) image.
len(gt_bboxes[0])

3

In [84]:
# First ground-truth box divided by 4, the same scaling the test function
# applies before comparing boxes with the targets.
bbox = gt_bboxes[0][0] / 4
# Class label of that box; relies on gt_labels from an earlier cell.
label = gt_labels[0][0] 

In [86]:
# Inspect the scaled box.
bbox

tensor([ 2.5000,  5.0000, 50.0000, 60.0000])

In [85]:
# Inspect the label of the first box.
label

tensor(1)

In [87]:
# Truncated box centre: bbox[0::2] picks the two x coordinates and
# bbox[1::2] the two y coordinates; each pair is averaged and cut to an int.
int_ctx, int_cty = int(sum(bbox[0::2]) / 2), int(sum(bbox[1::2]) / 2)

In [79]:
# Fractional part of the x centre, i.e. the quantity the test function
# calls x_off.
sum(bbox[0::2]) / 2 - int(sum(bbox[0::2]) / 2)

tensor(0.2500)

In [80]:
# Truncated x centre of the scaled box.
int(sum(bbox[0::2]) / 2)

26

In [None]:
# Display the centre heatmap target returned by get_targets.
center_target

In [None]:
# Decode detections from the target maps themselves (passed where the head
# predictions would normally go), with rescaling on and NMS off.
detections = self.get_bboxes([center_target], [wh_target], [offset_target],
                                 img_metas,
                                 rescale=True,
                                 with_nms=False)

In [125]:
# Keep the first three detections of the first image: boxes come from the
# first tuple element, class labels from the second.
out_bboxes = detections[0][0][:3]
out_clses = detections[0][1][:3]

In [136]:
# Class labels of the three kept detections.
out_clses

tensor([2, 1, 1])

In [137]:
# zip() is lazy, so this displays only the iterator object, not the
# (box, label) pairs.
zip(out_bboxes, out_clses)

<zip at 0x7f9ea2874fa0>

In [151]:
# For every decoded box, walk through the ground-truth boxes and print the
# running match state after each comparison. The state stays True once any
# ground-truth box has matched on all four coordinates.
for bbox, cls in zip(out_bboxes, out_clses):
    flag = False
    for gt_bbox, gt_cls in zip(gt_bboxes[0], gt_labels[0]):
        flag = flag or bool((bbox[:4] == gt_bbox[:4]).all())
        print(flag)
    # Each decoded box must have matched at least one ground-truth box.
    assert flag, 'get_bboxes is wrong'

False
False
True
True
True
True
False
True
True


In [140]:
# Coordinates of the first decoded box (first four columns, score dropped).
out_bboxes[0][:4]

tensor([ 10.,  20., 100., 240.])

In [144]:
# Coordinates of the first ground-truth box, for comparison with the first
# decoded box.
gt_bboxes[0][0][:4]

tensor([ 10.,  20., 200., 240.])

In [152]:
# Check whether the first decoded box equals the third ground-truth box in
# all four coordinates.
(out_bboxes[0][:4] == gt_bboxes[0][2][:4]).all()

tensor(True)