In [4]:
# Convert CSV to COCO JSON file

import csv
import json
import os
from PIL import Image

# Print the kernel's current working directory (useful when checking where
# any relative paths would resolve).
print(os.getcwd())


/home/cara/oregon_critters/scripts


In [5]:

def _read_image_size(image_path):
    """Return the ``(width, height)`` in pixels of the image at ``image_path``.

    Pillow is imported lazily so that ``csv_to_coco`` can be used with a
    caller-supplied ``image_size_fn`` even where Pillow is not installed.

    Raises:
        OSError: if the file is missing or cannot be decoded as an image.
    """
    from PIL import Image

    # The context manager closes the file handle as soon as the header is read.
    with Image.open(image_path) as img:
        return img.size


def csv_to_coco(csv_file_path, output_json_path, image_size_fn=None):
    """Convert a bounding-box CSV into a COCO-style JSON annotation file.

    The CSV must have a header row with these columns:

    * ``full_path_new`` - image path; written verbatim as ``file_name`` and
      used as the key that groups rows belonging to the same image.
    * ``CName`` - class name; rows whose class is not in the built-in
      category table are skipped.
    * ``X``, ``Y``, ``W``, ``H`` - bounding box, parsed as floats and written
      as ``bbox = [X, Y, W, H]`` with ``area = W * H``.
      NOTE(review): assumes these are already in COCO's top-left / pixel
      convention - confirm against the CSV producer.

    Image ids are assigned 1, 2, ... in order of first appearance among the
    kept rows; annotation ids are assigned 1, 2, ... in row order.

    Args:
        csv_file_path: Path of the CSV file to read.
        output_json_path: Path of the JSON file to write (overwritten).
        image_size_fn: Optional callable ``path -> (width, height)`` used to
            obtain each image's pixel dimensions. Defaults to opening the
            file with Pillow. It is called once per distinct image.

    Raises:
        KeyError: if a required column is missing from the CSV.
        ValueError: if a bounding-box field is not a valid float.
        OSError: if a file cannot be opened (CSV, output, or - with the
            default ``image_size_fn`` - an image).
    """
    if image_size_fn is None:
        image_size_fn = _read_image_size

    # Class name -> COCO category id. The names must match the CSV's "CName"
    # values exactly, so spellings are kept as-is.
    category_id_map = {
        "Bat": 0,
        "CanadaJay": 1,
        "Coyote": 2,
        "PileatedWoodpecker": 3,
        "Owl": 4,
        "Mink": 5,
        "RedFox": 6,
        "Marten": 7,
        "AmericanRobin": 8,
        "DouglasSquirrel": 9,
        "FlyingSquirrel": 10,
        "Grouse": 11,
        "Invertebrate": 12,
        "MountainBeaver": 13,
        "OtherBird": 14,
        "SmallMammal": 15,
        "Warbler": 16,
        "Chickadee": 17,
        "MountainQuail": 18,
        "StripedSkunk": 19,
        "Human": 20,
        "Dog": 21,
        "BlackBear": 22,
        "BlackTailedDeer": 23,
        "Bobcat": 24,
        "Cougar": 25,
        "DarkEyedJunco": 26,
        "GraySquirrel": 27,
        "Herp": 28,
        "NorthernFlicker": 29,
        "Opossum": 30,
        "Rabbit": 31,
        "Racoon": 32,
        "RooseveltElk": 33,
        "SpottedSkunk": 34,
        "StellersJay": 35,
        "Thrush": 36,
        "TownsendsChipmunk": 37,
        "VariedThrush": 38,
        "Weasel": 39,
        "Woodpecker": 40,
        "Woodrat": 41,
        "Wren": 42,
        "GroundSquirrel": 43,
        "GrayFox": 44
    }

    coco_data = {
        "info": {
            "year": 2023,
            "version": "1.0",
            "description": "CSV to COCO conversion",
            "contributor": "",
            "url": "",
            "date_created": "2023-08-18"
        },
        "licenses": [],
        "categories": [
            {"id": class_id, "name": class_name, "supercategory": "object"}
            for class_name, class_id in category_id_map.items()
        ],
        "images": [],
        "annotations": []
    }

    image_id_map = {}  # file path -> image id already assigned
    annotation_id = 1

    # newline='' lets the csv module handle line endings itself, so quoted
    # fields containing newlines are parsed correctly.
    with open(csv_file_path, 'r', newline='') as csv_file:
        for row in csv.DictReader(csv_file):
            filename = row['full_path_new']
            category_id = category_id_map.get(row['CName'])
            if category_id is None:
                # Skip rows with unknown classes.
                continue

            box_x = float(row['X'])
            box_y = float(row['Y'])
            box_width = float(row['W'])
            box_height = float(row['H'])

            image_id = image_id_map.get(filename)
            if image_id is None:
                # First annotation for this image: register it with the
                # image's own pixel size, not the size of this bounding box.
                image_width, image_height = image_size_fn(filename)
                image_id = len(coco_data['images']) + 1
                image_id_map[filename] = image_id
                coco_data['images'].append({
                    "id": image_id,
                    "file_name": filename,
                    "width": image_width,
                    "height": image_height
                })

            coco_data['annotations'].append({
                "id": annotation_id,
                "image_id": image_id,
                "category_id": category_id,
                "bbox": [box_x, box_y, box_width, box_height],
                "area": box_width * box_height,
                "iscrowd": 0
            })
            annotation_id += 1

    with open(output_json_path, 'w') as output_json_file:
        json.dump(coco_data, output_json_file, indent=4)

In [7]:
## BOTH
# Convert the "bothB" split CSV into its COCO JSON file.
csv_file_path, output_json_path = (
    '/home/cara/oregon_critters/sampled_ds_bothB_split.csv',
    '/home/cara/oregon_critters/json/dataset_bothB.json',
)
csv_to_coco(csv_file_path=csv_file_path, output_json_path=output_json_path)

In [4]:
## GROUND

# Active run: the full ground CSV (all splits together).
csv_file_path, output_json_path = (
    '/home/cara/oregon_critters/sampled_ds_ground_620_split.csv',
    '/home/cara/oregon_critters/json/dataset_ground_620.json',
)
csv_to_coco(csv_file_path=csv_file_path, output_json_path=output_json_path)

# Per-split runs (currently disabled). To convert a single split, substitute
# the matching input/output pair above:
#   train: '/home/cara/oregon_critters/sampled_ds_ground_620_train.csv'
#       -> '/home/cara/oregon_critters/json/dataset_ground_620_train.json'
#   val:   '/home/cara/oregon_critters/sampled_ds_ground_620_val.csv'
#       -> '/home/cara/oregon_critters/json/dataset_ground_620_val.json'
#   test:  '/home/cara/oregon_critters/sampled_ds_ground_620_test.csv'
#       -> '/home/cara/oregon_critters/json/dataset_ground_620_test.json'


In [7]:
## TRAIL

# Active runs: the full trail CSV first, then the test split. The loop
# variables are the same module-level names the other cells assign, so after
# this cell they hold the test-split paths.
#
# Per-split runs that are currently disabled:
#   train: '/home/cara/oregon_critters/sampled_ds_trail_180_train.csv'
#       -> '/home/cara/oregon_critters/json/dataset_trail_180_train.json'
#   val:   '/home/cara/oregon_critters/sampled_ds_trail_180_val.csv'
#       -> '/home/cara/oregon_critters/json/dataset_trail_180_val.json'
for csv_file_path, output_json_path in (
    (
        '/home/cara/oregon_critters/sampled_ds_trail_180_split.csv',
        '/home/cara/oregon_critters/json/dataset_trail_180.json',
    ),
    (
        '/home/cara/oregon_critters/sampled_ds_trail_180_test.csv',
        '/home/cara/oregon_critters/json/dataset_trail_180_test.json',
    ),
):
    csv_to_coco(csv_file_path, output_json_path)