# Data Download

This notebook demonstrates how to download data from the following sources:
- UNICEF (GigaMaps)
- Overture Maps
- OpenStreetMap (OSM)
- Microsoft Building Footprints
- Google Open Buildings
- Global Human Settlement Layer (GHSL)

## Imports and Setup

In [1]:
import pandas as pd
import geopandas as gpd

import os 
os.chdir('../')
from utils import download_utils
from utils import config_utils

import warnings
warnings.filterwarnings('ignore')
warnings.simplefilter('ignore')

%load_ext autoreload
%autoreload 2

## Data Configurations

In [16]:
# Both files are addressed relative to the current working directory, which the
# setup cell changes with os.chdir.
working_dir = os.getcwd()

# Profile file handed to download_unicef later in the notebook
# (presumably access credentials, judging by the file name -- confirm).
profile_filename = "configs/creds.share"
profile_file = os.path.join(working_dir, profile_filename)

# YAML data configuration consumed by every download_* call below.
config_filename = "configs/data_configs/data_config_ISO_LCA.yaml"
config_file = os.path.join(working_dir, config_filename)

config = config_utils.load_config(config_file)

## Download UNICEF (GigaMaps) Data

In [15]:
# Download the UNICEF records described by `config`; `profile_file` is the
# path to configs/creds.share built in the configuration cell.
unicef = download_utils.download_unicef(config, profile_file)
print(f"Data dimensions: {unicef.shape}")
# Preview up to three random rows. Capping n at len(unicef) avoids the
# ValueError that sample() raises when fewer than three rows were returned,
# and the fixed random_state keeps the preview identical across re-runs.
unicef.sample(n=min(3, len(unicef)), random_state=42)

Processing NIC: 100%|████████████████████| 1/1 [00:01<00:00,  1.76s/it]


Data dimensions: (1364, 9)


Unnamed: 0,UID,source,iso,country,region,subregion,name,giga_id_school,geometry
1137,UNICEF-NIC-SCHOOL-00001137,UNICEF,NIC,Nicaragua,Americas,Latin America and the Caribbean,,1137,POINT (-86.46552 12.73560)
682,UNICEF-NIC-SCHOOL-00000682,UNICEF,NIC,Nicaragua,Americas,Latin America and the Caribbean,,682,POINT (-86.11874 12.71894)
1173,UNICEF-NIC-SCHOOL-00001173,UNICEF,NIC,Nicaragua,Americas,Latin America and the Caribbean,,1173,POINT (-86.57574 12.92773)


## Download Overture Maps Data

In [7]:
# Download Overture Maps records for the "school" category described by `config`.
overture_schools = download_utils.download_overture(config, category="school")
print(f"Data dimensions: {overture_schools.shape}")
# Preview up to three random rows. Capping n at the frame length avoids the
# ValueError that sample() raises when fewer than three rows were returned,
# and the fixed random_state keeps the preview identical across re-runs.
overture_schools.sample(n=min(3, len(overture_schools)), random_state=42)

  0%|                    | 0/1 [00:00<?, ?it/s]Processing CAF:   0%|                    | 0/1 [00:00<?, ?it/s]Processing CAF: 100%|████████████████████| 1/1 [00:00<00:00,  8.13it/s]Processing CAF: 100%|████████████████████| 1/1 [00:00<00:00,  8.06it/s]

Data dimensions: (42, 9)


Unnamed: 0,UID,source,iso,country,region,subregion,name,giga_id_school,geometry
40,OVERTURE-CAF-SCHOOL-00000100,OVERTURE,CAF,Central African Republic,Africa,Sub-Saharan Africa,Mampho Secondary School,40,POINT (26.36719 6.14055)
37,OVERTURE-CAF-SCHOOL-00000096,OVERTURE,CAF,Central African Republic,Africa,Sub-Saharan Africa,State Public School Shahkot,37,POINT (19.26238 8.62042)
5,OVERTURE-CAF-SCHOOL-00000011,OVERTURE,CAF,Central African Republic,Africa,Sub-Saharan Africa,Zana Community Christian Schools,5,POINT (24.60337 5.61146)


In [9]:
# Download Overture Maps records for the "non_school" category, passing
# exclude="school" to the downloader.
overture_nonschools = download_utils.download_overture(
    config, category="non_school", exclude="school"
)
print(overture_nonschools.shape)
# Preview up to three random rows. Capping n at the frame length avoids the
# ValueError that sample() raises when fewer than three rows were returned,
# and the fixed random_state keeps the preview identical across re-runs.
overture_nonschools.sample(n=min(3, len(overture_nonschools)), random_state=42)

Processing TJK: 100%|████████████████████| 1/1 [00:00<00:00,  5.10it/s]


(212, 9)


Unnamed: 0,UID,source,iso,country,region,subregion,name,giga_id_school,geometry
58,OVERTURE-TJK-NON_SCHOOL-00000141,OVERTURE,TJK,Tajikistan,Asia,Central Asia,"Central Republican Stadium Dushanbe, Tajikistan",58,POINT (68.77881 38.58867)
152,OVERTURE-TJK-NON_SCHOOL-00000345,OVERTURE,TJK,Tajikistan,Asia,Central Asia,Office of civil freedoms/Офис гражданских свобод,152,POINT (68.79190 38.56270)
196,OVERTURE-TJK-NON_SCHOOL-00000448,OVERTURE,TJK,Tajikistan,Asia,Central Asia,Barqi Tojik,196,POINT (68.75547 38.58720)


## Download OpenStreetMap (OSM) Data

In [8]:
# Download OpenStreetMap records for the "school" category described by `config`.
osm_schools = download_utils.download_osm(config, category="school")
print(osm_schools.shape)
# Preview up to three random rows. Capping n at the frame length avoids the
# ValueError that sample() raises when fewer than three rows were returned,
# and the fixed random_state keeps the preview identical across re-runs.
osm_schools.sample(n=min(3, len(osm_schools)), random_state=42)

  0%|                    | 0/1 [00:00<?, ?it/s]Processing TJK:   0%|                    | 0/1 [00:00<?, ?it/s]Processing TJK: 100%|████████████████████| 1/1 [00:00<00:00,  1.66it/s]Processing TJK: 100%|████████████████████| 1/1 [00:00<00:00,  1.65it/s]


(732, 9)


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
234,OSM-TJK-SCHOOL-00000234,OSM,TJK,Tajikistan,Asia,Central Asia,,POINT (68.73007 38.57116),234
409,OSM-TJK-SCHOOL-00000409,OSM,TJK,Tajikistan,Asia,Central Asia,,POINT (71.96532 37.18400),409
475,OSM-TJK-SCHOOL-00000475,OSM,TJK,Tajikistan,Asia,Central Asia,,POINT (70.83522 38.54546),475


In [10]:
# Download OpenStreetMap records for the "non_school" category described by `config`.
osm_nonschools = download_utils.download_osm(config, category="non_school")
print(osm_nonschools.shape)
# Preview up to three random rows. Capping n at the frame length avoids the
# ValueError that sample() raises when fewer than three rows were returned,
# and the fixed random_state keeps the preview identical across re-runs.
osm_nonschools.sample(n=min(3, len(osm_nonschools)), random_state=42)

Processing TJK: 100%|████████████████████| 1/1 [00:01<00:00,  1.74s/it]


(5512, 9)


Unnamed: 0,UID,source,iso,country,region,subregion,name,geometry,giga_id_school
4337,OSM-TJK-NON_SCHOOL-00004337,OSM,TJK,Tajikistan,Asia,Central Asia,Масҷиди ҷомеи Ҳазрати Шоҳ,POINT (70.57642 39.97346),4337
5117,OSM-TJK-NON_SCHOOL-00005117,OSM,TJK,Tajikistan,Asia,Central Asia,Колхоз Росси,POINT (68.82791 38.56008),5117
2618,OSM-TJK-NON_SCHOOL-00002618,OSM,TJK,Tajikistan,Asia,Central Asia,Суди ноҳия Сангвор,POINT (70.48422 38.69672),2618


## Download Building Footprints

#### Microsoft Building Footprints

In [5]:
# Fetch the Microsoft building footprints (source="ms") for the loaded config,
# with verbose output enabled. Any return value is shown as the cell output.
download_utils.download_buildings(
    config,
    source="ms",
    verbose=True,
)

#### Google Open Buildings

In [None]:
# Fetch the Google Open Buildings footprints (source="google") for the loaded
# config, with verbose output enabled. Any return value is shown as the cell output.
download_utils.download_buildings(
    config,
    source="google",
    verbose=True,
)

## Download Global Human Settlement Layer (GHSL) Data

#### GHSL BUILT-C

In [11]:
# Fetch the GHSL BUILT-C layer (type="built_c") for the loaded config.
# Any return value is shown as the cell output.
download_utils.download_ghsl(
    config,
    type="built_c",
)

#### GHSL SMOD

In [12]:
# Fetch the GHSL SMOD layer (type="smod") for the loaded config.
# Any return value is shown as the cell output.
download_utils.download_ghsl(
    config,
    type="smod",
)