# Data processing: GeoJSON generation

This notebook reads geospatial data (a GeoPackage of Ecuadorian provinces) and tabular data (a CSV file), merges them on a common column, sums a set of columns row by row, and rescales selected columns. It then writes the processed geographic data to a GeoJSON file, ready for further analysis or visualization.

In [71]:
import geopandas as gpd
import pandas as pd

In [108]:
# Load the tabular results from "resultadosF.csv" into a plain pandas DataFrame
dfdata = pd.read_csv("resultadosF.csv")

# Load the geometry layer from the GeoPackage "ecuador_provincias.gpkg" into a GeoDataFrame
df = gpd.read_file("ecuador_provincias.gpkg")

In [111]:
# Align the join key: rename the 'PROVINCIA' column of 'dfdata' to 'DPA_DESPRO'
# so both tables share the same column name.
dfdata = dfdata.rename(columns={'PROVINCIA': 'DPA_DESPRO'})

# Inner-join the tabular data onto the geometries using the GeoDataFrame's own
# merge() method (the form geopandas recommends) so the result stays a
# GeoDataFrame carrying the geometry column and CRS of 'df'.
# NOTE(review): an inner join silently drops rows whose 'DPA_DESPRO' value does
# not match exactly in both tables -- confirm no rows are lost.
result = df.merge(dfdata, on='DPA_DESPRO', how='inner')

In [129]:
# Columns whose values are added together, row by row, to build 'despues'
inicio_cols = [
    '2019_2020INICIO',
    '2020_2021INICIO',
    '2021_2022INICIO',
    '2022_2023INICIO',
]

# Row-wise total of the columns above, stored in the new 'despues' column
result['despues'] = result.loc[:, inicio_cols].sum(axis="columns")

In [None]:
# Keep only the columns needed for the output layer.
# The explicit .copy() makes the subset an independent object, so the later
# in-place column assignments on 'result' do not trigger pandas'
# SettingWithCopyWarning or depend on view-vs-copy semantics.
result = result[['OBJECTID', 'DPA_PROVIN', 'DPA_DESPRO', 'DPA_VALOR', 'DPA_ANIO',
                'REI_CODIGO', 'REN_CODIGO', 'PEE_CODIGO', 'COD_PROVINCIA', 'antes', 'despues', 'Shape_Leng', 'Shape_Area',
                'geometry']].copy()

In [138]:
# Scale 'antes' down by a factor of 10 and store it back in the same column
# NOTE(review): presumably 'antes' is a total over ten periods -- confirm
result['antes'] = result['antes'].div(10)

# Scale 'despues' down by a factor of 4 and store it back in the same column
# ('despues' is built earlier as the sum of four '*INICIO' columns)
result['despues'] = result['despues'].div(4)

# Generate GeoJSON

In [137]:
# Write 'result' to disk as "capaNueva.json" using the GeoJSON driver
result.to_file(filename="capaNueva.json", driver="GeoJSON")