## Imports and Setup

In [1]:
import os
import pandas as pd
import geopandas as gpd

import sys
# Put ../utils/ first on the module search path so the two project helper
# modules imported below can be resolved. The path is relative, so it is
# interpreted against the kernel's working directory (presumably the folder
# this notebook lives in -- confirm when running from elsewhere).
sys.path.insert(0, "../utils/")
import download_utils
import config_utils

import warnings
warnings.filterwarnings('ignore')
warnings.simplefilter('ignore')

# Enable IPython's autoreload extension in mode 2: imported modules are
# reloaded before each cell executes, so edits to the local helper modules
# take effect without restarting the kernel.
%load_ext autoreload
%autoreload 2

## Data Config

In [2]:
# Location of the data configuration, relative to the project root.
filename = "configs/data_config.yaml"

# Note: despite its name, `cwd` holds the PARENT of the current working
# directory, which is used as the root for the config path below.
cwd = os.path.dirname(os.getcwd())
config_file = os.path.join(cwd, filename)

# Build the config object that every download/load helper below receives.
config = config_utils.create_config(config_file)

## Load Data Files

In [3]:
# Load the UNICEF school records via the project helper, driven by `config`.
unicef = download_utils.load_unicef(config)

# Preview three rows. The fixed seed keeps the displayed rows identical on
# every Restart & Run All (an unseeded sample changes on each execution).
unicef.sample(3, random_state=42)

INFO:root:Number of CSV files: 39
Processing SLV: 100%|████████████████████| 39/39 [00:13<00:00,  2.96it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/unicef.geojson
INFO:root:Data dimensions: (437362, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
319038,UNICEF-BRA-SCHOOL-00092569,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,PERILLIER MADEMOISELLE,POINT (-46.70824 -23.72955),6c439afd-9808-3428-9339-9db4aeeb4671
85939,UNICEF-NGA-SCHOOL-00061064,UNICEF,NGA,Nigeria,Africa,Sub-Saharan Africa,Kin Kids Science and Arts Nursery and Primary ...,POINT (7.12124 11.17277),98fe4bc6-8d1d-337c-8a3a-67359fdbc6da
173463,UNICEF-THA-SCHOOL-00020028,UNICEF,THA,Thailand,Asia,South-eastern Asia,วัดท่าเสา,POINT (100.46284 17.37023),363596c4-a0bb-3e35-8100-5ae3b559c593


## Download Overture Maps Data

In [4]:
# Fetch Overture Maps points for the "school" category, driven by `config`.
overture_schools = download_utils.download_overture(config, category="school")

# Preview three rows. The fixed seed keeps the displayed rows identical on
# every Restart & Run All (an unseeded sample changes on each execution).
overture_schools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [00:17<00:00,  2.46it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/overture.geojson
INFO:root:Data dimensions: (61280, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
46592,OVERTURE-ZAF-SCHOOL-00020608,OVERTURE,ZAF,South Africa,Africa,Sub-Saharan Africa,Turquoise Harmony Institute,POINT (28.05447 -26.13847),
21571,OVERTURE-THA-SCHOOL-00005667,OVERTURE,THA,Thailand,Asia,South-eastern Asia,Kapongpittayakom School.,POINT (98.39729 8.71277),
59008,OVERTURE-BRA-SCHOOL-00002060,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Khronos School,POINT (-46.52742 -23.65380),


In [5]:
# Fetch Overture Maps points for the "non_school" category, driven by `config`.
overture_nonschools = download_utils.download_overture(config, category="non_school")

# Preview three rows. The fixed seed keeps the displayed rows identical on
# every Restart & Run All (an unseeded sample changes on each execution).
overture_nonschools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [02:07<00:00,  3.04s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/overture.geojson
INFO:root:Data dimensions: (607105, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
192565,OVERTURE-NGA-NON_SCHOOL-00003193,OVERTURE,NGA,Nigeria,Africa,Sub-Saharan Africa,Jayz Bar & Lounge,POINT (3.32358 6.65564),
356804,OVERTURE-BRA-NON_SCHOOL-00141231,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Clinical Pet,POINT (-35.97176 -8.27581),
81218,OVERTURE-UKR-NON_SCHOOL-00005554,OVERTURE,UKR,Ukraine,Europe,Eastern Europe,Coffee time,POINT (35.04421 48.46829),


## Download OpenStreetMap Data

In [6]:
# Fetch OpenStreetMap points for the "school" category, driven by `config`.
osm_schools = download_utils.download_osm(config, category="school")

# Preview three rows. The fixed seed keeps the displayed rows identical on
# every Restart & Run All (an unseeded sample changes on each execution).
osm_schools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [00:13<00:00,  3.20it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/osm.geojson
INFO:root:Data dimensions: (42443, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
2669,OSM-GIN-SCHOOL-00000096,OSM,GIN,Guinea,Africa,Sub-Saharan Africa,École Coranique,POINT (-9.46065 8.54927),
25526,OSM-BRA-SCHOOL-00003465,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,CE Sonho Encantado,POINT (-40.19574 -20.05433),
3108,OSM-GIN-SCHOOL-00000535,OSM,GIN,Guinea,Africa,Sub-Saharan Africa,École primaire de Bourouwal kassa,POINT (-12.50149 11.44960),


In [7]:
# Fetch OpenStreetMap points for the "non_school" category, driven by `config`.
osm_nonschools = download_utils.download_osm(config, category="non_school")

# Preview three rows. The fixed seed keeps the displayed rows identical on
# every Restart & Run All (an unseeded sample changes on each execution).
osm_nonschools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [01:27<00:00,  2.09s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/osm.geojson
INFO:root:Data dimensions: (423445, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
392042,OSM-BRA-NON_SCHOOL-00083556,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,M C L Comércio e Serviços Veterinarios,POINT (-46.37374 -23.95238),
52271,OSM-HUN-NON_SCHOOL-00017207,OSM,HUN,Hungary,Europe,Eastern Europe,Tüskevár,POINT (17.78506 46.05081),
344602,OSM-BRA-NON_SCHOOL-00036116,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,,POINT (-45.05792 -21.18429),
