# scripts to clean png files

In [14]:
# imports
import os
import glob
import json
import pandas as pd

In [15]:
current_path = os.getcwd()

In [16]:
"""
    Collects information based on filenames from collected images
        and from reading csv data
"""

def get_community_data(file_paths:list[str], community_names:dict) -> list:
    all_data = {}

    for file_path in file_paths:
        # reset dictionary
        community_data = {
        "name" : None,
        "filename" : None, 
        }

        # get metadata
        picture = file_path.split("/")[-1]
        comm_code = picture.split(".")[0]
        comm_name = community_names.get(comm_code, "?")

        # append data
        community_data["name"] = comm_name
        community_data["filename"] = picture
        all_data[comm_code] = community_data   

    return all_data

In [17]:
# export to json
def export_to_json(filename: str, all_data: dict) -> None:
    patient_json = json.dumps(all_data, indent=2)

    with open(filename, "w") as json_data:
        json_data.write(patient_json)

# call functions above

In [18]:
""" read csv file """
comm_data = pd.read_csv("../../../Data/final_calgary_communities.csv")
comm_data = comm_data.set_index("COMM_CODE")["NAME"].to_dict()
print(comm_data)

{'ERL': 'ERLTON', 'COA': 'COACH HILL', 'DIA': 'DIAMOND COVE', 'THO': 'THORNCLIFFE', 'FHT': 'FOREST HEIGHTS', 'HAY': 'HAYSBORO', 'CSC': 'CITYSCAPE', 'BLM': 'BELMONT', 'DOV': 'DOVER', 'MRT': 'MARTINDALE', 'WAL': 'WALDEN', 'VAR': 'VARSITY', 'COL': 'COLLINGWOOD', 'QLD': 'QUEENSLAND', 'WOO': 'WOODLANDS', 'OAK': 'OAKRIDGE', 'SOW': 'SOUTHWOOD', 'RDL': 'ROSEDALE', 'APP': 'APPLEWOOD PARK', 'RID': 'RIDEAU PARK', 'ARB': 'ARBOUR LAKE', 'BVD': 'BELVEDERE', 'CPF': 'COPPERFIELD', 'SIG': 'SIGNAL HILL', 'CAM': 'CAMBRIAN HEIGHTS', 'BRT': 'BRITANNIA', 'WBN': 'WOODBINE', 'RUN': 'RUNDLE', 'ERI': 'ERIN WOODS', 'PIN': 'PINERIDGE', 'HIW': 'HIGHWOOD', 'MAL': 'MAYLAND HEIGHTS', 'MAC': 'MACEWAN GLEN', 'DRG': 'DEER RIDGE', 'MOP': 'MOUNT PLEASANT', 'SOV': 'SOUTHVIEW', 'EDG': 'EDGEMONT', 'RED': 'RED CARPET', 'SSD': 'SUNNYSIDE', 'CAP': 'CAPITOL HILL', 'UMR': 'UPPER MOUNT ROYAL', 'SAD': 'SADDLE RIDGE', 'BED': 'BEDDINGTON HEIGHTS', 'PAT': 'PATTERSON', 'SOC': 'SOUTH CALGARY', 'COR': 'CORAL SPRINGS', 'EAU': 'EAU CLAIRE'

In [19]:
""" create dictionary of pictures to access """
pictures = glob.glob("../*") # list of pictures
print(pictures)
picture_data = get_community_data(pictures, comm_data)

export_to_json("communities.json", picture_data)

['../CHR.png', '../DAL.png', '../QLD.png', '../MPL.png', '../NOL.png', '../BLM.png', '../RDL.png', '../BOW.png', '../UNI.png', '../UMR.png', '../ERL.png', '../WOO.png', '../STA.png', '../HAW.png', '../MDH.png', '../DNW.png', '../OGD.png', '../BNF.png', '../BLN.png', '../LMR.png', '../FAL.png', '../TEM.png', '../CIT.png', '../APP.png', '../DOV.png', '../DNE.png', '../CED.png', '../CRM.png', '../PIN.png', '../WLD.png', '../KIN.png', '../EDG.png', '../REN.png', '../KEL.png', '../WWO.png', '../WBN.png', '../BVD.png', '../MRT.png', '../FAI.png', '../FLN.png', '../SVO.png', '../SOM.png', '../THO.png', '../CHW.png', '../SAD.png', '../STR.png', '../CPF.png', '../PEN.png', '../PKD.png', '../ERI.png', '../HAR.png', '../CHA.png', '../CHV.png', '../MAF.png', '../COU.png', '../DIS.png', '../HPK.png', '../DRN.png', '../WHI.png', '../RCK.png', '../WIL.png', '../BRI.png', '../FHT.png', '../TAR.png', '../COA.png', '../SHN.png', '../COV.png', '../MON.png', '../SSD.png', '../SPH.png', '../VAR.png', '../E