## Imports and Setup

In [1]:
import os
import pandas as pd
import geopandas as gpd

import sys
# Put ../utils/ first on the module search path so that download_utils and
# config_utils (presumably located there — confirm) can be imported below.
# The entry is relative, so it depends on the current working directory.
sys.path.insert(0, "../utils/")
import download_utils
import config_utils

import warnings
# Suppress every warning for the rest of the session.
# NOTE(review): this blanket filter also hides warnings raised by
# dependencies; consider narrowing it to specific categories or modules.
warnings.filterwarnings('ignore')

%load_ext autoreload
%autoreload 2

## Data Config

In [None]:
# Location of the data config, relative to the project root.
filename = "configs/data_config.yaml"

# NOTE: despite its name, `cwd` holds the *parent* of the current working
# directory, so the config path only resolves when the kernel runs from a
# direct subfolder of the directory that contains `configs/`.
cwd = os.path.dirname(os.getcwd())
config_file = os.path.join(cwd, filename)

# Build the config object through the project helper; it is passed to every
# loader/downloader call in the cells below.
config = config_utils.create_config(config_file)

## Load Data Files

In [3]:
# Load the UNICEF records through the project helper, driven by `config`.
unicef = download_utils.load_unicef(config)

# Preview three random rows. No random_state is given, so the rows shown
# differ from run to run.
unicef.sample(n=3)

INFO:root:Number of CSV files: 39
Processing SLV: 100%|████████████████████| 39/39 [00:12<00:00,  3.06it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/unicef.geojson
INFO:root:Data dimensions: (437362, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
402057,UNICEF-KEN-SCHOOL-00003201,UNICEF,KEN,Kenya,Africa,Sub-Saharan Africa,ST JOSEPH SECONDARY SCHOOL-TAPOYO,POINT (35.20760 1.33619),9e8efed7-2a64-3117-8dff-e88bc96ad91e
171757,UNICEF-THA-SCHOOL-00018322,UNICEF,THA,Thailand,Asia,South-eastern Asia,ชุมชนวัดหนองคล้ายางพะเนียด,POINT (102.81766 16.87536),7c796794-e12d-33b6-bd9a-742a186ee617
337052,UNICEF-BRA-SCHOOL-00110650,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,RIO D AREIA ROSA OGG E M C DE EI EF,POINT (-51.13668 -25.29594),20b09599-d3ff-3f57-98f7-f01a83eb33f3


## Download Overture Maps Data

In [7]:
# Fetch Overture records in the "school" category for every ISO code that
# appears in the UNICEF frame.
overture_schools = download_utils.download_overture(
    config, unicef["iso"].unique(), category="school",
)

# Preview three random rows (unseeded, so they vary between runs).
overture_schools.sample(n=3)

Processing SLV: 100%|████████████████████| 39/39 [00:15<00:00,  2.50it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/overture.geojson
INFO:root:Data dimensions: (61183, 8), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry
39418,OVERTURE-ZAF-SCHOOL-00012884,OVERTURE,ZAF,South Africa,Africa,Sub-Saharan Africa,Zimele High school,POINT (28.76866 -31.60819)
14469,OVERTURE-THA-SCHOOL-00000428,OVERTURE,THA,Thailand,Asia,South-eastern Asia,Don Bosco Banpong Technological College,POINT (99.90846 13.80133)
25149,OVERTURE-GHA-SCHOOL-00001028,OVERTURE,GHA,Ghana,Africa,Sub-Saharan Africa,Akwatia GCD Quarters D/A Basic School,POINT (-0.80300 6.02955)


In [5]:
# Fetch Overture records in the "non_school" category for the same ISO codes.
# `exclude="school"` presumably filters school-tagged places out of this
# set — confirm against download_utils.download_overture.
overture_nonschools = download_utils.download_overture(
    config, unicef["iso"].unique(), category="non_school", exclude="school",
)

# Preview three random rows (unseeded, so they vary between runs).
overture_nonschools.sample(n=3)

Processing SLV: 100%|████████████████████| 39/39 [01:58<00:00,  3.04s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/overture.geojson
INFO:root:Data dimensions: (606471, 8), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry
541025,OVERTURE-BRA-NON_SCHOOL-00386434,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Labareda Bar e Restaurante,POINT (-34.91897 -8.19144)
171893,OVERTURE-BRA-NON_SCHOOL-00017302,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,COCO S BAR,POINT (-46.36872 -23.51439)
369243,OVERTURE-BRA-NON_SCHOOL-00214652,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Rio Quente -Hotel Cristal,POINT (-48.75367 -17.77860)


## Download OpenStreetMap Data

In [10]:
# Fetch OpenStreetMap records in the "school" category for every ISO code
# that appears in the UNICEF frame.
osm_schools = download_utils.download_osm(
    config, unicef["iso"].unique(), category="school",
)

# Preview three random rows (unseeded, so they vary between runs).
osm_schools.sample(n=3)

Processing SLV: 100%|████████████████████| 39/39 [00:11<00:00,  3.32it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/osm.geojson
INFO:root:Data dimensions: (40726, 8), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry
22652,OSM-BRA-SCHOOL-00012853,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Escola Familia Agricola Agostinho Romao Da Silva,POINT (-45.13176 -4.58986)
21605,OSM-BRA-SCHOOL-00011806,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,UE Sagrado Coração,POINT (-44.86880 -1.82598)
14844,OSM-BRA-SCHOOL-00005045,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,EMEF Novo Irajá,POINT (-40.23317 -19.90329)


In [11]:
# Fetch OpenStreetMap records in the "non_school" category for the same ISO
# codes.
# NOTE(review): the Overture non-school download passes exclude="school" but
# this call passes no `exclude` — confirm whether download_osm handles the
# school exclusion internally.
osm_nonschools = download_utils.download_osm(
    config, unicef["iso"].unique(), category="non_school",
)

# Preview three random rows (unseeded, so they vary between runs).
osm_nonschools.sample(n=3)

Processing SLV: 100%|████████████████████| 39/39 [01:21<00:00,  2.08s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/osm.geojson
INFO:root:Data dimensions: (410420, 8), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry
193902,OSM-ZAF-NON_SCHOOL-00000965,OSM,ZAF,South Africa,Africa,Sub-Saharan Africa,,POINT (28.30223 -25.71512)
303693,OSM-BRA-NON_SCHOOL-00093607,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Templo Aderalto do Amanhecer,POINT (-57.66404 -16.06128)
311564,OSM-BRA-NON_SCHOOL-00101478,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Igreja Assembleia De Deus - Missão,POINT (-49.04501 -5.21136)
