In [1]:
# coding: utf-8
# This script is modified from https://github.com/lars76/kmeans-anchor-boxes

from __future__ import division, print_function
import sys
import numpy as np

In [2]:
def iou(box, clusters):
    """
    Calculates the Intersection over Union (IoU) between a box and k clusters.
    param:
        box: tuple or array, shifted to the origin (i. e. width and height)
        clusters: numpy array of shape (k, 2) where k is the number of clusters
    return:
        numpy array of shape (k, 0) where k is the number of clusters
    """
    x = np.minimum(clusters[:, 0], box[0])
    y = np.minimum(clusters[:, 1], box[1])
    if np.count_nonzero(x == 0) > 0 or np.count_nonzero(y == 0) > 0:
        raise ValueError("Box has no area")

    intersection = x * y
    box_area = box[0] * box[1]
    cluster_area = clusters[:, 0] * clusters[:, 1]

    iou_ = np.true_divide(intersection, box_area + cluster_area - intersection + 1e-10)
    # iou_ = intersection / (box_area + cluster_area - intersection + 1e-10)

    return iou_


def avg_iou(boxes, clusters):
    """
    Calculates the average Intersection over Union (IoU) between a numpy array of boxes and k clusters.
    param:
        boxes: numpy array of shape (r, 2), where r is the number of rows
        clusters: numpy array of shape (k, 2) where k is the number of clusters
    return:
        average IoU as a single float
    """
    return np.mean([np.max(iou(boxes[i], clusters)) for i in range(boxes.shape[0])])


def translate_boxes(boxes):
    """
    Translates all the boxes to the origin.
    param:
        boxes: numpy array of shape (r, 4)
    return:
    numpy array of shape (r, 2)
    """
    new_boxes = boxes.copy()
    for row in range(new_boxes.shape[0]):
        new_boxes[row][2] = np.abs(new_boxes[row][2] - new_boxes[row][0])
        new_boxes[row][3] = np.abs(new_boxes[row][3] - new_boxes[row][1])
    return np.delete(new_boxes, [0, 1], axis=1)


def kmeans(boxes, k, dist=np.median):
    """
    Calculates k-means clustering with the Intersection over Union (IoU) metric.
    param:
        boxes: numpy array of shape (r, 2), where r is the number of rows
        k: number of clusters
        dist: distance function
    return:
        numpy array of shape (k, 2)
    """
    rows = boxes.shape[0]

    distances = np.empty((rows, k))
    last_clusters = np.zeros((rows,))

    np.random.seed()

    # the Forgy method will fail if the whole array contains the same rows
    clusters = boxes[np.random.choice(rows, k, replace=False)]

    while True:
        for row in range(rows):
            distances[row] = 1 - iou(boxes[row], clusters)

        nearest_clusters = np.argmin(distances, axis=1)

        if (last_clusters == nearest_clusters).all():
            break

        for cluster in range(k):
            clusters[cluster] = dist(boxes[nearest_clusters == cluster], axis=0)

        last_clusters = nearest_clusters

    return clusters


def parse_anno(annotation_path, target_size=None):
    anno = open(annotation_path, 'r')
    result = []
    for idx, line in enumerate(anno):
        #print (line)
        s = line.strip().split(' ')
        try:
            index = s[1].split(',')
        except:
            continue
        #print (index)
        #img_w = int(s[2])
        #img_h = int(s[3])
        img_w = 600
        img_h = 600
        s = index
        #s = s[4:]
        
        box_cnt = len(s) // 5
        for i in range(box_cnt):
            x_min, y_min, x_max, y_max = float(int(s[i*5])), float(int(s[i*5+1])), float(int(s[i*5+2])), float(int(s[i*5+3]))
            width = x_max - x_min
            height = y_max - y_min
            #print (idx, width, height)
            try:
                assert width > 0
                assert height > 0
            except Exception as e:
                print (line)
            # use letterbox resize, i.e. keep the original aspect ratio
            # get k-means anchors on the resized target image size
            if target_size is not None:
                resize_ratio = min(target_size[0] / img_w, target_size[1] / img_h)
                width *= resize_ratio
                height *= resize_ratio
                result.append([width, height])
            # get k-means anchors on the original image size
            else:
                result.append([width, height])
    result = np.asarray(result)
    return result


def get_kmeans(anno, cluster_num=9):

    anchors = kmeans(anno, cluster_num)
    ave_iou = avg_iou(anno, anchors)

    anchors = anchors.astype('int').tolist()

    anchors = sorted(anchors, key=lambda x: x[0] * x[1])

    return anchors, ave_iou


if __name__ == '__main__':
    # target resize format: [width, height]
    # if target_resize is speficied, the anchors are on the resized image scale
    # if target_resize is set to None, the anchors are on the original image scale
    target_size = [544, 544]
    size = target_size[0]
    strides = [size/4, size/8, size/16]
    annotation_path = "/home/yuyue/yuyue/yolo_TCT/yolo_big_patch/train_544.txt"
    anno_result = parse_anno(annotation_path, target_size=target_size)
    anchors, ave_iou = get_kmeans(anno_result, 9)
    
    anchors_new = []
    for num,anchor in enumerate(anchors):
        anchors_new.append(((np.array(anchor)/size)*strides[int(num/3)]).tolist())
    
    print (anchors_new, anchors)
    anchor_string = ''
    for anchor in anchors_new:
        anchor_string += '{},{}, '.format(anchor[0], anchor[1])
    anchor_string = anchor_string[:-2]

    print('anchors are:')
    print(anchor_string)
    print('the average iou is:')
    print(ave_iou)

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/14e3bac611e8066b0b23a65a910c90e47fb8534a_247_5687.npy 49,371,51,371,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/85bb6e67c15c6d5a34dbb9ba2a441da03742eee9_358_10584.npy 80,14,81,14,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/85bb6e67c15c6d5a34dbb9ba2a441da03742eee9_358_10585.npy 40,14,41,14,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/85bb6e67c15c6d5a34dbb9ba2a441da03742eee9_358_10586.npy 24,14,25,14,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/6cfec5eb9cba8576c1a17199476d30aac39c3b29_1071_1623.npy 497,7,497,8,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/6cfec5eb9cba8576c1a17199476d30aac39c3b29_1071_1624.npy 513,7,513,8,0

/hdd/sd2/data/TCT/densenet/data/big_patch_size/data/train/pos/544/6cfec5eb9cba8576c1a17199476d30aac39c3b29_1071_1625.npy 279,7,279,8,0 399,17,463,82,0

/hdd/sd2/data/TCT/densenet/data

ValueError: Box has no area