forked from LUMAIS/AntDet_YOLOv5
-
Notifications
You must be signed in to change notification settings - Fork 0
/
lbxTorch.py
200 lines (171 loc) · 8.95 KB
/
lbxTorch.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
:Description: Evaluation and conversion script that counts annotated objects per label imported from Labelbox
and converts those annotations into YOLOv5 format.
:Authors: (c) Valentyna Pryhodiuk <vpryhodiuk@lumais.com>
:Date: 2020-11-04
"""
import json
import os
from argparse import ArgumentParser, ArgumentDefaultsHelpFormatter, SUPPRESS
# Mapping from Labelbox class titles to YOLO class IDs; IDs follow the
# declaration order of the names below.
# "uncategorized" (ID 8) is deliberately left out so such objects are omitted
# during conversion; count_objects() re-inserts it before counting.
_CLASS_NAMES = (
    "ant",
    "ant-head",
    "trophallaxis-ant",
    "larva",
    "trophallaxis-larva",
    "food-noise",
    "pupa",
    "barcode",
)
class_name_to_id_mapping = {name: cid for cid, name in enumerate(_CLASS_NAMES)}
# Object-level attribute (classification answer) values that are tallied separately.
attributes = {'overlapping', 'blurry', "side-view", "low-confidence"}
# Convert a string "<n1>-<n2>,<n3>,..." into a list of [start, end] pairs;
# a bare number n becomes [n, n]. Values stay strings ('$' may mean "last frame").
def strparse(fstr):
    """Split *fstr* on commas and turn every token into a [beginning, ending] pair.

    Args:
        fstr (str): comma-separated intervals, e.g. "1-5,8,10-$"

    Returns:
        list[list[str]]: one [beginning, ending] pair per token
    """
    intervals = []
    for token in fstr.split(','):
        bounds = token.split('-')
        if len(bounds) == 1:
            # a single frame number denotes the degenerate interval [n, n]
            bounds = bounds + bounds
        intervals.append(bounds)
    return intervals
# Convert the frame dicts to the required YOLO format and write them to disk
def convert_to_yolo(jsfile, img_size, fstr, filename, outdir):
    """Write one YOLOv5 label txt file per frame in the requested ranges.

    Args:
        jsfile (list): frames loaded from the Labelbox JSON export
        img_size (tuple): (width, height) of the image/frame in pixels
        fstr (str): string of intervals <n1>-<n2>,<n3>-<n4>,<n5>... ('$' = last frame)
        filename (str): prefix of every produced txt file
        outdir (str): output directory for the txt files (created if missing)
    """
    if not os.path.isdir(outdir):
        os.makedirs(outdir)
    image_w, image_h = img_size
    for beginning, ending in strparse(fstr):
        if ending == '$':
            ending = len(jsfile)
        try:
            for i in range(int(beginning) - 1, int(ending)):
                frame = jsfile[i]
                print_buffer = []
                # For each bounding box
                for obj in frame['objects']:
                    # Membership test (NOT .get() truthiness): the class with
                    # ID 0 ("ant") is falsy and would otherwise be skipped.
                    if obj["title"] not in class_name_to_id_mapping:
                        # invalid class or "uncategorized" -- omit the object
                        continue
                    # Skip objects explicitly marked with a low-confidence answer.
                    low_confidence = bool(obj['classifications']) and any(
                        answer['value'] == 'low-confidence'
                        for cl in obj['classifications']
                        for answer in cl['answers'])
                    if low_confidence:
                        continue
                    class_id = class_name_to_id_mapping[obj["title"]]
                    b = obj['bbox']
                    # Transform the bbox as required by YOLO v5: centre point and
                    # size, normalised by the image dimensions.
                    b_center_x = (b["left"] + b["width"] / 2) / image_w
                    b_center_y = (b["top"] + b["height"] / 2) / image_h
                    b_width = b["width"] / image_w
                    b_height = b["height"] / image_h
                    print_buffer.append(
                        "{} {:.3f} {:.3f} {:.3f} {:.3f}".format(class_id, b_center_x, b_center_y, b_width,
                                                                b_height))
                framenum = str(frame["frameNumber"])
                # Save the annotation to disk via a joined path: no os.chdir(),
                # so the caller's working directory is left untouched and a
                # relative outdir stays valid across repeated calls.
                outpath = os.path.join(outdir, '{}_{}.txt'.format(filename, framenum))
                with open(outpath, "w") as lbl:
                    lbl.write("\n".join(print_buffer) + "\n")
            print('saved as {}/{}_<number>.txt'.format(outdir, filename))
        except IndexError:
            print("WARNING: Invalid frame's range. Number of edited frames is {}".format(len(jsfile)))
# counts number of modified objects on frames, which were listed in the keyframes
def count_objects(jsfile, keyframes, obj_cost):
    """Count keyframe-modified objects (and their attributes) per class.

    Args:
        jsfile (list): frames loaded from the Labelbox JSON export
        keyframes (str): string of intervals <n1>-<n2>,<n3>-<n4>,<n5>...
        obj_cost (float): cost of a single annotation (0 suppresses the total)

    Returns:
        tuple: (number of modified objects, number of keyframed attributes)

    Raises:
        IndexError: when an interval lies outside the available frames
    """
    # restore the class that is removed to simplify the YOLO conversion
    if not class_name_to_id_mapping.get("uncategorized"):
        class_name_to_id_mapping["uncategorized"] = 8
    cls_count = dict.fromkeys(class_name_to_id_mapping, 0)
    atr_count = dict.fromkeys(attributes, 0)
    frames_seen = []
    for beginning, ending in strparse(keyframes):
        # clamp '$' and over-long ranges to the number of available frames
        if ending == '$' or int(ending) > len(jsfile):
            ending = len(jsfile)
        first = int(beginning) - 1
        last = int(ending)
        if not 0 <= first < last:
            raise IndexError("Invalid frame's range.")
        for frame in jsfile[first:last]:
            frames_seen.append(frame["frameNumber"])
            for obj in frame['objects']:
                # only objects actually changed on this frame are counted
                if not obj['keyframe']:
                    continue
                if obj['title'] in cls_count:
                    cls_count[obj["title"]] += 1
                for classif in obj['classifications'] or ():
                    for answer in classif['answers'] or ():
                        if answer['value'] in atr_count and answer['keyframe']:
                            atr_count[answer['value']] += 1
    frames_seen.sort()
    print("Frames taken to account: ", frames_seen, "\n-----------Classes-----------")
    suma = 0
    for key, value in cls_count.items():
        suma += value
        print("{}: {}".format(key, value))
    print("----------Attributes----------")
    for key, value in atr_count.items():
        print("{}: {}".format(key, value))
    if obj_cost:
        print("------------Total-------------")
        print("""Total by class: {} \nCost: ${} \nTotal by attribute: {}""".format(suma,
                                                                                   suma * obj_cost,
                                                                                   sum(list(atr_count.values()))))
    return suma, sum(list(atr_count.values()))
if __name__ == '__main__':
    parser = ArgumentParser(description='Document Taxonomy Builder.',
                            formatter_class=ArgumentDefaultsHelpFormatter,
                            conflict_handler='resolve')
    parser.add_argument('-json-path', '--filepath', nargs='+',
                        help='Path for json files', required=True)
    # Mutually exclusive modes: convert with a frame size (-s) OR count
    # keyframed annotations (-k).
    group = parser.add_mutually_exclusive_group(required=True)
    group.add_argument('-s', '--frame-size', default=None, type=str,
                       help='The size format is WxH, for example: 800x600')
    parser.add_argument('-o', '--outp-dir', type=str,
                        default=os.path.join(os.getcwd(), 'labels'),
                        help='Output directory for the label files')
    parser.add_argument('--object-cost', help=SUPPRESS, default=0.03, type=float)
    parser.add_argument('-f', '--frames', type=str, default='1-$',
                        help='Range of frames')
    group.add_argument('-k', '--keyframed-objects', action="store_true",
                       help='True if annotations should be counted')
    args = parser.parse_args()
    for filepath in args.filepath:
        with open(filepath) as jsonFile:
            annotations = json.load(jsonFile)
        if args.keyframed_objects:
            count_objects(annotations, args.frames, args.object_cost)
        else:
            try:
                fm_size = tuple(int(d) for d in args.frame_size.split('x'))
                # splitext (NOT str.rstrip('.json'), which strips a character
                # *set* and would mangle names such as "json.json")
                filename = os.path.splitext(os.path.basename(filepath))[0]
                convert_to_yolo(annotations, fm_size, args.frames, filename, args.outp_dir)
            except AttributeError:
                # args.frame_size is None in conversion mode without -s
                print("AttributeError: can't convert annotations, unspecified argument value -s [FRAME_SIZE]." +
                      "\nTo count annotations in frame range specify -k [keyframed-objects] as True.")