## Imports and Setup

In [1]:
import os
import pandas as pd
import geopandas as gpd

import sys
sys.path.insert(0, "../utils/")
import download_utils
import config_utils

import warnings
warnings.filterwarnings('ignore')
warnings.simplefilter('ignore')

%load_ext autoreload
%autoreload 2

## Data Configurations

In [2]:
# Location of the YAML config, relative to the directory stored in `cwd` below.
filename = "configs/unicef_config.yaml"

# NOTE: despite its name, `cwd` holds the *parent* of the current working
# directory (the head returned by os.path.split), not the working directory itself.
cwd = os.path.split(os.getcwd())[0]
config_file = os.path.join(cwd, filename)

# Parsed configuration object passed to every download helper in this notebook.
config = config_utils.load_config(config_file)

## Load UNICEF Data 

In [3]:
# Load the UNICEF records through the project helper, driven by `config`.
unicef = download_utils.load_unicef(config)

# Preview three rows. A fixed random_state makes the preview identical on every
# Restart & Run All instead of changing (and churning the saved output) each run.
unicef.sample(3, random_state=42)

INFO:root:Number of CSV files: 1
Processing BRA: 100%|████████████████████| 1/1 [00:02<00:00,  2.23s/it]                                                 


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
122743,UNICEF-BRA-SCHOOL-00122743,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,,POINT (-52.35253 -31.76653),122743
76230,UNICEF-BRA-SCHOOL-00076230,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,,POINT (-48.24363 -18.95644),76230
109251,UNICEF-BRA-SCHOOL-00109251,UNICEF,BRA,Brazil,Americas,Latin America and the Caribbean,,POINT (-50.00232 -25.42589),109251


## Download Overture Maps Data

In [5]:
# Fetch Overture Maps points for the "school" category, driven by `config`.
overture_schools = download_utils.download_overture(config, category="school")

# Preview three rows. A fixed random_state makes the preview identical on every
# Restart & Run All instead of changing (and churning the saved output) each run.
overture_schools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [00:47<00:00,  1.14s/it]                                               


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
158886,OVERTURE-BRA-SCHOOL-00039755,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Caixa Escolar C M e I Menino Deus,POINT (-44.22571 -19.44823),
38038,OVERTURE-THA-SCHOOL-00015549,OVERTURE,THA,Thailand,Asia,South-eastern Asia,โรงเรียนเมืองกลางวิทยาคม,POINT (101.26592 16.61291),
93117,OVERTURE-UKR-SCHOOL-00002529,OVERTURE,UKR,Ukraine,Europe,Eastern Europe,Дитяча Музична школа,POINT (33.87071 50.83334),


In [5]:
# Fetch Overture Maps points for the "non_school" category.
# NOTE(review): exclude="school" presumably filters school-related entries out of
# the non-school set — confirm against download_utils.download_overture.
overture_nonschools = download_utils.download_overture(config, category="non_school", exclude="school")

# Preview three rows. A fixed random_state makes the preview identical on every
# Restart & Run All instead of changing (and churning the saved output) each run.
overture_nonschools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [02:32<00:00,  3.64s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/overture.geojson
INFO:root:Data dimensions: (660525, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
5382,OVERTURE-BIH-NON_SCHOOL-00002402,OVERTURE,BIH,Bosnia and Herzegovina,Europe,Southern Europe,Baraćuša,POINT (16.01257 44.70676),
605258,OVERTURE-BRA-NON_SCHOOL-00334784,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Al Mare Restaurante,POINT (-48.68347 -26.64404),
366212,OVERTURE-BRA-NON_SCHOOL-00095738,OVERTURE,BRA,Brazil,Americas,Latin America and the Caribbean,Private Pub,POINT (-34.84614 -7.14704),


## Download OpenStreetMap (OSM) Data

In [6]:
# Fetch OpenStreetMap points for the "school" category, driven by `config`.
osm_schools = download_utils.download_osm(config, category="school")

# Preview three rows. A fixed random_state makes the preview identical on every
# Restart & Run All instead of changing (and churning the saved output) each run.
osm_schools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [00:16<00:00,  2.52it/s]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/school/osm.geojson
INFO:root:Data dimensions: (53094, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
36473,OSM-BRA-SCHOOL-00005521,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,EM Boa União,POINT (-40.80898 -18.72364),
5543,OSM-CRI-SCHOOL-00000400,OSM,CRI,Costa Rica,Americas,Latin America and the Caribbean,Academia Tica,POINT (-84.62352 9.61934),
49459,OSM-BRA-SCHOOL-00018507,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Ec Nice Lobao,POINT (-44.20108 -2.60638),


In [7]:
# Fetch OpenStreetMap points for the "non_school" category, driven by `config`.
osm_nonschools = download_utils.download_osm(config, category="non_school")

# Preview three rows. A fixed random_state makes the preview identical on every
# Restart & Run All instead of changing (and churning the saved output) each run.
osm_nonschools.sample(3, random_state=42)

Processing BRA: 100%|████████████████████| 42/42 [01:37<00:00,  2.31s/it]                                               
INFO:root:Generated /home/itingzon.unicef/giga/data/vectors/non_school/osm.geojson
INFO:root:Data dimensions: (432023, 9), CRS: EPSG:4326


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
267859,OSM-UKR-NON_SCHOOL-00052389,OSM,UKR,Ukraine,Europe,Eastern Europe,Мед-сервіс-buaty,POINT (27.62054 50.59192),
114796,OSM-KEN-NON_SCHOOL-00009741,OSM,KEN,Kenya,Africa,Sub-Saharan Africa,Garden Park,POINT (39.74298 -3.95407),
351573,OSM-BRA-NON_SCHOOL-00035392,OSM,BRA,Brazil,Americas,Latin America and the Caribbean,Paulinho Muquifu,POINT (-45.08585 -21.88101),


## Download Microsoft Building Footprints (MS) Data

In [3]:
# Download the Microsoft Building Footprints data through the project helper.
# The return value is not captured; the call is made for its side effects.
# NOTE(review): verbose=True presumably enables progress/log output — confirm
# against download_utils.download_ms.
download_utils.download_ms(config, verbose=True)

Processing BRA: 100%|████████████████████| 41/41 [00:00<00:00, 1106.16it/s]                                             


## Download Global Human Settlement Layer (GHSL) Data

In [3]:
# Download the GHSL raster through the project helper (return value not captured).
# Heads-up: in the logged run below this fetched a ~8.9 GB zip archive and took
# roughly 12 minutes before the archive was extracted.
download_utils.download_ghsl(config)

--2023-12-17 09:19:09--  https://jeodpp.jrc.ec.europa.eu/ftp/jrc-opendata/GHSL/GHS_BUILT_C_GLOBE_R2023A/GHS_BUILT_C_FUN_E2018_GLOBE_R2023A_54009_10/V1-0/GHS_BUILT_C_FUN_E2018_GLOBE_R2023A_54009_10_V1_0.zip
Resolving jeodpp.jrc.ec.europa.eu (jeodpp.jrc.ec.europa.eu)... 139.191.241.87
Connecting to jeodpp.jrc.ec.europa.eu (jeodpp.jrc.ec.europa.eu)|139.191.241.87|:443... connected.
HTTP request sent, awaiting response... 200 OK
Length: 9505003782 (8.9G) [application/zip]
Saving to: ‘/home/itingzon.unicef/giga/data/rasters/ghsl/ghsl.zip’


2023-12-17 09:30:58 (12.8 MB/s) - ‘/home/itingzon.unicef/giga/data/rasters/ghsl/ghsl.zip’ saved [9505003782/9505003782]

Archive:  /home/itingzon.unicef/giga/data/rasters/ghsl/ghsl.zip
  inflating: /home/itingzon.unicef/giga/data/rasters/ghsl/GHS_BUILT_C_FUN_E2018_GLOBE_R2023A_54009_10_V1_0.tif  
  inflating: /home/itingzon.unicef/giga/data/rasters/ghsl/GHS_BUILT_C_FUN_E2018_GLOBE_R2023A_54009_10_V1_0.tif.ovr  
  inflating: /home/itingzon.unicef/giga/dat

In [7]:
# Second GHSL download, this time with an explicit `type` argument.
# NOTE(review): "smod" presumably selects the GHS-SMOD (settlement model) layer
# instead of the helper's default product — confirm against download_utils.download_ghsl.
download_utils.download_ghsl(config, type="smod")