## Imports and Setup

In [1]:
import os
import pandas as pd
import geopandas as gpd

import sys
sys.path.insert(0, "../utils/")
import download_utils
import config_utils

import warnings
warnings.filterwarnings('ignore')
warnings.simplefilter('ignore')

%load_ext autoreload
%autoreload 2

## Data Configurations

In [2]:
# Base directory is the PARENT of the current working directory
# (presumably the repository root when run from the notebooks folder — confirm).
cwd = os.path.dirname(os.getcwd())
filename = "configs/data_config.yaml"

# Resolve the YAML path against that base directory and build the config
# object that every download/load call in this notebook receives.
config_file = os.path.join(cwd, filename)
config = config_utils.create_config(config_file)

## Load UNICEF Data 

In [3]:
# Load the UNICEF school records using the shared `config`.
# (The recorded log shows the loader processing per-country CSV files and
# generating a unicef.geojson file.)
unicef = download_utils.load_unicef(config)

# Seeded so the 3-row preview is identical on every Restart & Run All.
unicef.sample(3, random_state=42)

INFO:root:Number of CSV files: 41
Processing SLV: 100%|████████████████████| 41/41 [00:19<00:00,  2.13it/s]                                                                                                   
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/unicef.geojson
INFO:root:Data dimensions: (471606, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
149610,UNICEF-UZB-SCHOOL-00006250,UNICEF,UZB,Uzbekistan,Asia,Central Asia,"62,Beruniy,Karakalpakstan",POINT (60.74413 41.68336),95ade0cb-ebea-3ecd-8026-bd0b3299d81f
319263,UNICEF-BRA-SCHOOL-00092794,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,OTTONIEL JUNQUEIRA PROFESSOR,POINT (-47.00281 -24.31819),4a2e3bbc-7330-3de0-a90d-0962e06f9855
393669,UNICEF-SSD-SCHOOL-00000975,UNICEF,SSD,South Sudan,Africa,Sub-Saharan Africa,Malual One Primary school,POINT (29.29315 7.00136),d187d673-ee99-3c00-83bb-e46ceccbe31f


## Download Overture Maps Data

In [3]:
# Download Overture Maps points for the "school" category using the shared
# `config`. (The recorded log shows an overture.geojson file being generated.)
overture_schools = download_utils.download_overture(config, category="school")

# Seeded so the 3-row preview is identical on every Restart & Run All.
overture_schools.sample(3, random_state=42)

Processing ZWE: 100%|████████████████████| 42/42 [00:24<00:00,  1.71it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/overture.geojson
INFO:root:Data dimensions: (90075, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
72468,OVERTURE-ZAF-SCHOOL-00006631,OVERTURE,ZAF,South Africa,Africa,Sub-Saharan Africa,Thaba Morula High School,POINT (22.23735 -33.60360),
2012,OVERTURE-BRA-SCHOOL-00001412,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Amanda Instituto de Beleza,POINT (-45.51610 -21.35730),
35043,OVERTURE-KEN-SCHOOL-00000436,OVERTURE,KEN,Kenya,Africa,Sub-Saharan Africa,North Airport Schools,POINT (36.97234 -1.28482),


In [4]:
# Download Overture Maps points for the "non_school" category.
# NOTE(review): `exclude="school"` presumably drops school-related entries
# from the non-school set — confirm against download_utils.download_overture.
overture_nonschools = download_utils.download_overture(config, category="non_school", exclude="school")

# Seeded so the 3-row preview is identical on every Restart & Run All.
overture_nonschools.sample(3, random_state=42)

Processing ZWE: 100%|████████████████████| 42/42 [02:48<00:00,  4.02s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/overture.geojson
INFO:root:Data dimensions: (734990, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
169043,OVERTURE-BRA-NON_SCHOOL-00161936,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Balacobaco ROCK Burger - Hamburgueria e PUB,POINT (-46.03531 -23.41346),
35695,OVERTURE-BRA-NON_SCHOOL-00028588,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Barbearia Brother's,POINT (-42.70625 -18.82322),
427210,OVERTURE-HND-NON_SCHOOL-00004926,OVERTURE,HND,Honduras,Americas,Latin America and the Caribbean,Restaurante Agua Verdosa,POINT (-87.32534 13.95012),


## Download OpenStreetMap (OSM) Data

In [6]:
# Download OpenStreetMap points for the "school" category using the shared
# `config`. (The recorded log shows an osm.geojson file being generated.)
osm_schools = download_utils.download_osm(config, category="school")

# Seeded so the 3-row preview is identical on every Restart & Run All.
osm_schools.sample(3, random_state=42)

Processing ZWE: 100%|████████████████████| 42/42 [00:13<00:00,  3.22it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/osm.geojson
INFO:root:Data dimensions: (44405, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
12406,OSM-BRA-SCHOOL-00011009,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,CEJA Prof Milton Marques Curvo,POINT (-57.69096 -16.07752),
40006,OSM-THA-SCHOOL-00001422,OSM,THA,Thailand,Asia,South-eastern Asia,โรงเรียนบ้านหนองพรหม,POINT (101.24692 13.36741),
43926,OSM-ZAF-SCHOOL-00000825,OSM,ZAF,South Africa,Africa,Sub-Saharan Africa,Hoerskool Diamant,POINT (24.77248 -28.75135),


In [7]:
# Download OpenStreetMap points for the "non_school" category.
# NOTE(review): unlike the Overture non-school download, no `exclude`
# argument is passed here — confirm download_osm keeps schools out of this
# set by itself.
osm_nonschools = download_utils.download_osm(config, category="non_school")

# Seeded so the 3-row preview is identical on every Restart & Run All.
osm_nonschools.sample(3, random_state=42)

Processing ZWE: 100%|████████████████████| 42/42 [01:29<00:00,  2.12s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/osm.geojson
INFO:root:Data dimensions: (429344, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
84016,OSM-BRA-NON_SCHOOL-00071259,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Rei do Sushi,POINT (-38.54053 -3.73940),
65427,OSM-BRA-NON_SCHOOL-00052670,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Posto Azevedo,POINT (-42.69013 -13.01851),
80196,OSM-BRA-NON_SCHOOL-00067439,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Salgados CWB,POINT (-49.25052 -25.38093),


## Download Microsoft Building Footprints (MS) Data

In [None]:
# Download Microsoft Building Footprints data using the shared `config`.
# `verbose=True` presumably turns on progress/log output — confirm in
# download_utils. This cell has no execution count or recorded output in the
# saved notebook.
download_utils.download_msf(
    config,
    verbose=True,
)