# Preparación del modelo

## Importación de librerías

In [1]:
import glob, os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import geopandas as gpd
import rasterio as rio
import seaborn as sns

# Carga de datos

## Geodataframe

In [12]:
agebs = gpd.read_file('data/colima/agebs.gpkg')
agebs["area"] = agebs.area / 1000 # ha
agebs.drop(columns=["CVE_ENT","CVE_MUN", "CVE_AGEB","CVE_LOC","geometry"], inplace=True)
agebs = pd.DataFrame(agebs)

## Zonal Statistics

In [14]:
df = pd.read_csv('data/megaGDF.csv')
df = df.merge(agebs, on="CVEGEO")
df.drop(columns=["CVE_ENT","CVE_MUN","CVE_LOC"], inplace=True)
df.head()

Unnamed: 0,CVEGEO,CVE_AGEB,_count,_sum,_mean,class,time,area
0,600200010676,676,0.0,0.0,,Depth,0,381.991619
1,600200010676,676,2918.0,1344.881608,0.460892,Depth,10200,381.991619
2,600200010676,676,2922.0,1347.627452,0.4612,Depth,10500,381.991619
3,600200010676,676,2923.0,1349.16868,0.46157,Depth,10800,381.991619
4,600200010676,676,2924.0,1350.054582,0.461715,Depth,11100,381.991619


## Denue and INV

In [4]:
denue_inv = pd.read_csv('data/denue_inv.csv')
denue_inv.head()

Unnamed: 0,CVE_AGEB,POBTOT,POB0_14_P,P15A29A_P,P30A59A_P,GRAPROES,P_CD_P,VPH_C_EL_P,VPH_EXSA_P,VPH_DREN_P,...,PARATRAN_C,DRENAJEP_C,TRANSCOL_C,ARBOLES_C,ACESOAUT_C,PUESSEMI_C,PUESAMBU_C,escuela,farmacia,hospital
0,273,99,107.54,6.137333,15.728,3.978667,3.346667,33.333333,32.222,33.333333,...,54,54,53,46,54,54,54,1.0,0.0,0.0
1,318,1959,582.91,17.921154,32.048654,10.256538,7.5425,86.151731,86.311923,86.311923,...,164,149,136,102,165,167,164,13.0,6.0,0.0
2,322,2143,617.33,17.74717,30.118113,11.442453,7.085472,88.486038,88.553396,88.553396,...,155,150,144,70,159,155,151,13.0,3.0,3.0
3,362,2342,644.78,21.292,33.82,9.617714,5.100857,91.145714,91.380857,91.380857,...,103,102,97,45,105,102,102,4.0,1.0,1.0
4,411,1140,381.58,17.902195,33.179268,11.79561,4.030732,80.487805,80.487805,80.487805,...,134,133,130,87,68,134,132,12.0,2.0,0.0


## Join

In [15]:
df_full = df.merge(denue_inv, on="CVE_AGEB")
df_full

Unnamed: 0,CVEGEO,CVE_AGEB,_count,_sum,_mean,class,time,area,POBTOT,POB0_14_P,...,PARATRAN_C,DRENAJEP_C,TRANSCOL_C,ARBOLES_C,ACESOAUT_C,PUESSEMI_C,PUESAMBU_C,escuela,farmacia,hospital
0,0600200010676,0676,0.0,0.000000,,Depth,0,381.991619,2119,587.58,...,91,84,87,45,93,88,91,9.0,1.0,0.0
1,0600200010676,0676,2918.0,1344.881608,0.460892,Depth,10200,381.991619,2119,587.58,...,91,84,87,45,93,88,91,9.0,1.0,0.0
2,0600200010676,0676,2922.0,1347.627452,0.461200,Depth,10500,381.991619,2119,587.58,...,91,84,87,45,93,88,91,9.0,1.0,0.0
3,0600200010676,0676,2923.0,1349.168680,0.461570,Depth,10800,381.991619,2119,587.58,...,91,84,87,45,93,88,91,9.0,1.0,0.0
4,0600200010676,0676,2924.0,1350.054582,0.461715,Depth,11100,381.991619,2119,587.58,...,91,84,87,45,93,88,91,9.0,1.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
6556,0601000010362,0362,0.0,0.000000,,Velocity,900,227.156848,2342,644.78,...,103,102,97,45,105,102,102,4.0,1.0,1.0
6557,0601000010362,0362,0.0,0.000000,,Velocity,9000,227.156848,2342,644.78,...,103,102,97,45,105,102,102,4.0,1.0,1.0
6558,0601000010362,0362,0.0,0.000000,,Velocity,9300,227.156848,2342,644.78,...,103,102,97,45,105,102,102,4.0,1.0,1.0
6559,0601000010362,0362,0.0,0.000000,,Velocity,9600,227.156848,2342,644.78,...,103,102,97,45,105,102,102,4.0,1.0,1.0


In [16]:
df_full.describe()

Unnamed: 0,_count,_sum,_mean,time,area,POBTOT,POB0_14_P,P15A29A_P,P30A59A_P,GRAPROES,...,PARATRAN_C,DRENAJEP_C,TRANSCOL_C,ARBOLES_C,ACESOAUT_C,PUESSEMI_C,PUESAMBU_C,escuela,farmacia,hospital
count,6318.0,6318.0,5080.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,...,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0,6561.0
mean,7897.458371,29355.69,2.452911,12046.91358,399.982035,1770.259259,520.540741,18.291919,32.61174,10.222105,...,112.074074,106.851852,101.925926,61.444444,106.259259,112.666667,111.037037,7.814815,2.666667,0.888889
std,7277.629876,80850.77,5.092213,7058.657977,123.103015,817.774515,249.387994,3.559731,4.771108,1.920535,...,28.738444,29.786312,26.435616,19.62071,31.312771,28.82991,28.188672,5.99451,2.789079,1.165432
min,0.0,0.0,0.0,0.0,201.591953,99.0,107.54,6.137333,15.728,3.978667,...,54.0,54.0,53.0,33.0,52.0,54.0,54.0,1.0,0.0,0.0
25%,484.75,63.38227,0.220432,6000.0,315.090313,1258.0,298.18,16.823333,29.926604,9.434516,...,91.0,82.0,86.0,45.0,81.0,88.0,90.0,3.0,1.0,0.0
50%,6977.0,1946.393,0.72,12000.0,407.209309,1935.0,502.61,18.112558,33.179268,10.188958,...,112.0,108.0,101.0,58.0,102.0,114.0,111.0,6.0,2.0,1.0
75%,13714.0,16457.83,1.86,18300.0,457.6929,2143.0,617.33,20.5275,35.534118,11.442453,...,134.0,133.0,123.0,71.0,129.0,134.0,132.0,12.0,3.0,1.0
max,28751.0,1043661.0,36.3,24300.0,715.165608,4397.0,1341.77,25.398293,40.178511,13.536364,...,164.0,159.0,151.0,112.0,165.0,167.0,164.0,26.0,14.0,4.0
