In [10]:
import re
import json

## EwasteRecycling_NEW.geojson Data Preprocessing

In [11]:
# GeoJSON is UTF-8 by specification, so decode it explicitly instead of
# relying on the platform's locale encoding (e.g. cp1252 on Windows), which
# can corrupt or fail on non-ASCII text.
with open('EwasteRecycling_NEW.geojson', 'r', encoding='utf-8') as file:
    data = json.load(file)

In [12]:
# Reduce every feature to the three address fields embedded in the HTML
# table stored under its "Description" property, keeping the geometry as-is.

# Output property name -> pattern capturing the <td> text that follows the
# field's <th> label. Compiled once, outside the loop. `\s*` accepts any
# amount of whitespace (including none) between </th> and <td>.
field_patterns = {
    "Building Name": re.compile(r'ADDRESSBUILDINGNAME<\/th>\s*<td>(.*?)<\/td>'),
    "Street Name": re.compile(r'ADDRESSSTREETNAME<\/th>\s*<td>(.*?)<\/td>'),
    "Postal Code": re.compile(r'ADDRESSPOSTALCODE<\/th>\s*<td>(.*?)<\/td>'),
}

new_features = []
for feature in data['features']:
    # GeoJSON allows "properties": null, and "Description" itself may be
    # null; treat both as an empty description instead of raising.
    properties = feature.get('properties') or {}
    description = properties.get("Description") or ""

    # A field that is absent from the description becomes an empty string.
    new_properties = {}
    for label, pattern in field_patterns.items():
        match = pattern.search(description)
        new_properties[label] = match.group(1) if match else ""

    new_features.append({
        "type": "Feature",
        "properties": new_properties,
        "geometry": feature['geometry'],
    })

new_geojson = {
    "type": "FeatureCollection",
    "features": new_features
}

In [13]:
# Serialise the filtered FeatureCollection to a new GeoJSON file.
with open('filtered_EwasteRecycling.geojson', mode='w') as sink:
    json.dump(new_geojson, fp=sink)

## WasteTreatmentGEOJSON.geojson Data Preprocessing

In [14]:
# GeoJSON is UTF-8 by specification, so decode it explicitly instead of
# relying on the platform's locale encoding (e.g. cp1252 on Windows), which
# can corrupt or fail on non-ASCII text.
with open('WasteTreatmentGEOJSON.geojson', 'r', encoding='utf-8') as file:
    data = json.load(file)

In [15]:
# Reduce every feature to the name and address fields embedded in the HTML
# table stored under its "Description" property, keeping the geometry as-is.

# Output property name -> pattern capturing the <td> text that follows the
# field's <th> label. Compiled once, outside the loop. All patterns use
# `\s*` between </th> and <td> so they tolerate the same spacing variations.
# The NAME pattern is anchored on "<th>" so it matches only a header cell
# whose label is exactly NAME, not a longer label that merely ends in NAME.
field_patterns = {
    "Name": re.compile(r'<th>NAME<\/th>\s*<td>(.*?)<\/td>'),
    "Block House No.": re.compile(r'ADDRESSBLOCKHOUSENUMBER<\/th>\s*<td>(.*?)<\/td>'),
    "Street Name": re.compile(r'ADDRESSSTREETNAME<\/th>\s*<td>(.*?)<\/td>'),
    "Postal Code": re.compile(r'ADDRESSPOSTALCODE<\/th>\s*<td>(.*?)<\/td>'),
}

new_features = []
for feature in data['features']:
    # GeoJSON allows "properties": null, and "Description" itself may be
    # null; treat both as an empty description instead of raising.
    properties = feature.get('properties') or {}
    description = properties.get("Description") or ""

    # A field that is absent from the description becomes an empty string.
    new_properties = {}
    for label, pattern in field_patterns.items():
        match = pattern.search(description)
        new_properties[label] = match.group(1) if match else ""

    new_features.append({
        "type": "Feature",
        "properties": new_properties,
        "geometry": feature['geometry'],
    })

new_geojson = {
    "type": "FeatureCollection",
    "features": new_features
}

In [16]:
# Serialise the filtered FeatureCollection to a new GeoJSON file.
with open('filtered_WasteTreatmentGEOJSON.geojson', mode='w') as sink:
    json.dump(new_geojson, fp=sink)