In [1]:
import geopandas as gpd
import pandas as pd
import numpy as np
from copy import deepcopy

In [2]:
chirps_file = "../Data/vietnam/fluvial_defended/FD_1in500.csv"
# Load the flood table, discard rows that have any missing value, and then
# label the columns positionally as longitude, latitude and flood level.
chirps_ori = pd.read_csv(chirps_file).dropna()
chirps_ori.columns = ['Lon', 'Lat', 'flood_level']

In [3]:
# Work on an independent deep copy so the loaded table stays untouched.
chirps_data = chirps_ori.copy(deep=True)
chirps_data.describe()

Unnamed: 0,Lon,Lat,flood_level
count,10021110.0,10021110.0,10021110.0
mean,106.3773,14.64911,283.2828
std,1.293058,4.776309,448.61
min,102.1692,8.366667,0.01000005
25%,105.5158,10.345,0.9276007
50%,106.085,12.53167,2.431173
75%,107.0567,20.28583,999.0
max,109.5075,23.16583,999.0


In [4]:
# Remove permanent water bodies to reduce calculation time.
# Rows whose flood_level equals the sentinel value 999 are the ones the
# original note identifies as permanent water.
# Boolean indexing really drops those rows; DataFrame.where only replaced
# them with NaN and kept every row, so nothing downstream got any cheaper.
PERMANENT_WATER_LEVEL = 999
chirps_data = chirps_data.loc[chirps_data['flood_level'] < PERMANENT_WATER_LEVEL]
# Re-number the surviving rows so the index has no gaps.
chirps_data = chirps_data.reset_index(drop=True)

In [5]:
# Snap both coordinates to 3 decimal places so flood cells can later be
# matched against facility locations that are rounded the same way.
for coord in ('Lon', 'Lat'):
    chirps_data[coord] = chirps_data[coord].apply(lambda value: round(value, 3))

In [6]:
# Rounding the coordinates makes several records share one (Lon, Lat) pair
# while carrying different flood levels.
# Keep the maximum level per pair to emphasize the severity of the flood risk.
chirps_data = chirps_data.groupby(['Lon', 'Lat'])[['flood_level']].max()

In [7]:
# Summary statistics of the flood table in its current state; compare with
# the describe() output shown right after loading to see the effect of the
# filtering, rounding and aggregation steps.
chirps_data.describe()

Unnamed: 0,flood_level
count,5095788.0
mean,2.135067
std,2.165022
min,0.01000005
25%,0.589157
50%,1.521703
75%,2.83113
max,10.0


In [8]:
facs_file = "../Data/stroke-facs.csv"
# Map each source column that is kept to the short name used in this notebook.
# The dict order fixes the column order of the resulting frame.
facility_columns = {
    'Name_English': 'Facility_Name',
    'longitude': 'Lon',
    'latitude': 'Lat',
    'pro_name_e': 'Province',
    'dis_name_e': 'District',
}
stroke_data = pd.read_csv(facs_file)[list(facility_columns)].rename(columns=facility_columns)
# Round the coordinates to 3 decimal places, the same precision applied to
# the flood table, so the two can be joined on (Lon, Lat).
for coord in ('Lon', 'Lat'):
    stroke_data[coord] = stroke_data[coord].apply(lambda value: round(value, 3))

In [9]:
# Preview the first ten facilities.
stroke_data.head(10)

Unnamed: 0,Facility_Name,Lon,Lat,Province,District
0,115 People's Hospital,106.667,10.775,Ho Chi Minh City,District 10
1,University Medical Center HCMC-Branch 1,106.664,10.756,Ho Chi Minh City,District 5
2,Nhan Dan Gia Dinh Hospital,106.694,10.804,Ho Chi Minh City,Binh Thanh District
3,Nguyen Tri Phuong Hospital,106.67,10.755,Ho Chi Minh City,District 5
4,Thu Duc District Hospital,106.745,10.865,Ho Chi Minh City,Thu Duc District
5,An Binh Hospital,106.671,10.755,Ho Chi Minh City,District 5
6,Thong Nhat Hospital,106.653,10.792,Ho Chi Minh City,Tan Binh District
7,District 2 General Hospital,106.768,10.782,Ho Chi Minh City,District 2
8,Hoan My Saigon Hospital (CS1) Hoan My Group,106.684,10.8,Ho Chi Minh City,Phu Nhuan District
9,Tan Phu District Hospital,106.642,10.784,Ho Chi Minh City,Tan Phu District


In [10]:
# Left join: every facility is kept, and flood_level is NaN wherever no
# flood record shares the facility's rounded (Lon, Lat) pair.
facs_w_flood = pd.merge(stroke_data, chirps_data, on=['Lon', 'Lat'], how='left')

In [11]:
# Show only the facilities that matched a flood record.
# The check is restricted to flood_level so that a facility is not hidden
# merely because an unrelated field (e.g. Province or District) is missing.
facs_w_flood.dropna(subset=['flood_level'])

Unnamed: 0,Facility_Name,Lon,Lat,Province,District,flood_level
7,District 2 General Hospital,106.768,10.782,Ho Chi Minh City,District 2,1.423614
15,Xuyen A General Hospital (BVXA-HCMC),106.558,10.927,Ho Chi Minh City,Cu Chi District,3.151815
20,Vinmec International General Hospital-Central ...,106.72,10.795,Ho Chi Minh City,Binh Thanh District,0.509302
25,Tam Duc Heart Hospital,106.718,10.734,Ho Chi Minh City,District 7,0.748048
27,Bach Mai Hospital,105.841,21.002,Ha Noi,Dong Da District,1.11588
28,103 Military Hospital,105.79,20.967,Ha Noi,Ha Dong District,4.654653
30,Hanoi Thanh Nhan Municipal Hospital (formerly ...,105.859,21.003,Ha Noi,Hai Ba Trung District,0.826574
32,105 Military Hospital,105.496,21.117,Ha Noi,Son Tay Town,4.906386
33,E Hospital,105.79,21.051,Ha Noi,Cau Giay District,3.747965
34,Hanoi Medical University Hospital,105.83,21.002,Ha Noi,Dong Da District,1.199341
