# Preprocessing of the data

In [1]:
import geopandas as gpd
import rtree
import pandas as pd

## Tree data

In [2]:
# Load the tree inventory from GeoJSON and key every row by its 'Tree ID'
# column, so later tables can be matched back to individual trees.
df_trees = (
    gpd.read_file('../data/geo_data_trees.geojson')
    .set_index('Tree ID')
)

# Preview the first rows of the indexed table.
df_trees.head()

Unnamed: 0_level_0,Name,DBH (cm),Replacement Value (eur),Carbon Storage (kg),Carbon Storage (eur),Gross Carbon Sequestration (kg/yr),Gross Carbon Sequestration (eur/yr),Avoided Runoff (mcube/yr),Avoided Runoff (eur/yr),Carbon Avoided (kg/yr),...,Oxygen Production (kg/yr),Height (m),Crown Height (m),Crown Width (m),Canopy Cover (m2),Leaf Area (m2),Leaf Biomass (kg),Latitude,Longitude,geometry
Tree ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
1.0,Acer pseudoplatanus,8,179.43,12.0,1.92,1.1,0.17,0,0.01,,...,2.8,3.5,1.0,1.5,1.8,3.5,0.2,46.051599,11.072014,POINT (11.07201 46.05160)
2.0,Acer pseudoplatanus,8,179.43,12.9,2.07,1.1,0.18,0,0.01,,...,3.0,5.0,1.5,1.5,1.8,4.2,0.3,46.051541,11.072108,POINT (11.07211 46.05154)
3.0,Acer pseudoplatanus,9,227.09,16.2,2.61,1.3,0.2,0,0.01,,...,3.4,4.5,1.3,1.5,1.8,4.0,0.3,46.051668,11.071959,POINT (11.07196 46.05167)
4.0,Acer pseudoplatanus,11,482.46,25.7,4.13,1.6,0.26,0,0.02,,...,4.3,5.0,1.5,2.5,4.9,7.1,0.5,46.063778,11.15017,POINT (11.15017 46.06378)
7.0,Cupressus,25,1110.29,448.2,72.02,11.1,1.78,0,0.02,,...,29.5,8.0,2.4,1.5,1.8,6.6,1.5,46.052305,11.07155,POINT (11.07155 46.05230)


In [3]:
# Persist the indexed tree table as CSV; with pandas' default `index=True`
# the 'Tree ID' index is written as the first column.
# NOTE(review): assumes the ../data_clean directory already exists - confirm.
df_trees.to_csv(path_or_buf='../data_clean/trees.csv')

## Circoscrizioni (administrative districts)

In [4]:
# Load the district polygons (one row per circoscrizione).
df_circoscrizioni = gpd.read_file('../data/circoscrizioni.json')

# Preview the first five districts.
df_circoscrizioni.head(n=5)

Unnamed: 0,numero_cir,area,perimetro,nome,fumetto,geometry
0,2,15712181,17850,MEANO,Circoscrizione n. 2 - MEANO,"POLYGON ((11.15678 46.11661, 11.15687 46.11666..."
1,3,36949609,38485,BONDONE,Circoscrizione n. 3 - BONDONE,"POLYGON ((11.08026 46.11571, 11.08026 46.11571..."
2,4,8663138,16403,SARDAGNA,Circoscrizione n. 4 - SARDAGNA,"POLYGON ((11.09034 46.07917, 11.09032 46.07899..."
3,6,13199398,20575,ARGENTARIO,Circoscrizione n. 6 - ARGENTARIO,"POLYGON ((11.17163 46.08095, 11.17161 46.08106..."
4,11,3073349,10962,S.GIUSEPPE-S.CHIARA,Circoscrizione n. 11 - S.GIUSEPPE-S.CHIARA,"POLYGON ((11.11135 46.05878, 11.11137 46.05878..."


In [5]:
# Spatial left join: keep every tree and attach the attributes of the district
# polygon that the tree's point lies within. `index_right` in the result is the
# row label of the matched district in `df_circoscrizioni`.
df_tree_circo = gpd.sjoin(
    left_df=df_trees,
    right_df=df_circoscrizioni,
    how='left',
    predicate="within",
)

Unnamed: 0_level_0,Name,DBH (cm),Replacement Value (eur),Carbon Storage (kg),Carbon Storage (eur),Gross Carbon Sequestration (kg/yr),Gross Carbon Sequestration (eur/yr),Avoided Runoff (mcube/yr),Avoided Runoff (eur/yr),Carbon Avoided (kg/yr),...,Leaf Biomass (kg),Latitude,Longitude,geometry,index_right,numero_cir,area,perimetro,nome,fumetto
Tree ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
1.0,Acer pseudoplatanus,8,179.43,12,1.92,1.1,0.17,0,0.01,,...,0.2,46.051599,11.072014,POINT (11.07201 46.05160),2.0,4.0,8663138.0,16403.0,SARDAGNA,Circoscrizione n. 4 - SARDAGNA
2.0,Acer pseudoplatanus,8,179.43,12.9,2.07,1.1,0.18,0,0.01,,...,0.3,46.051541,11.072108,POINT (11.07211 46.05154),2.0,4.0,8663138.0,16403.0,SARDAGNA,Circoscrizione n. 4 - SARDAGNA
3.0,Acer pseudoplatanus,9,227.09,16.2,2.61,1.3,0.2,0,0.01,,...,0.3,46.051668,11.071959,POINT (11.07196 46.05167),2.0,4.0,8663138.0,16403.0,SARDAGNA,Circoscrizione n. 4 - SARDAGNA
4.0,Acer pseudoplatanus,11,482.46,25.7,4.13,1.6,0.26,0,0.02,,...,0.5,46.063778,11.150170,POINT (11.15017 46.06378),5.0,7.0,15433274.0,18464.0,POVO,Circoscrizione n. 7 - POVO
7.0,Cupressus,25,1110.29,448.2,72.02,11.1,1.78,0,0.02,,...,1.5,46.052305,11.071550,POINT (11.07155 46.05230),2.0,4.0,8663138.0,16403.0,SARDAGNA,Circoscrizione n. 4 - SARDAGNA
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
17664.0,Philadelphus,28.2,1354.8,396.2,63.66,10.7,1.71,0.1,0.13,,...,2.7,46.055851,11.129388,POINT (11.12939 46.05585),9.0,10.0,6962104.0,15418.0,OLTREFERSINA,Circoscrizione n. 10 - OLTREFERSINA
17665.0,Forsythia x intermedia,28.2,1354.8,320.9,51.56,10.5,1.68,0.1,0.21,,...,4.6,46.055402,11.129206,POINT (11.12921 46.05540),9.0,10.0,6962104.0,15418.0,OLTREFERSINA,Circoscrizione n. 10 - OLTREFERSINA
17666.0,Aucuba japonica,28.2,1354.8,356.2,57.22,6.3,1.01,0.1,0.14,,...,2.5,46.055867,11.129650,POINT (11.12965 46.05587),9.0,10.0,6962104.0,15418.0,OLTREFERSINA,Circoscrizione n. 10 - OLTREFERSINA
17667.0,Osmanthus fragrans,28.2,1354.8,240.7,38.67,4.3,0.6899999999999999,0.1,0.15,,...,3.8,46.053467,11.121152,POINT (11.12115 46.05347),4.0,11.0,3073349.0,10962.0,S.GIUSEPPE-S.CHIARA,Circoscrizione n. 11 - S.GIUSEPPE-S.CHIARA


In [45]:
# Show the complete district table so the `index_right` values produced by the
# spatial join can be matched to district rows. The table is already loaded as
# `df_circoscrizioni`, so reuse it instead of re-reading the file from disk.
df_circoscrizioni

Unnamed: 0,numero_cir,area,perimetro,nome,fumetto,geometry
0,2,15712181,17850,MEANO,Circoscrizione n. 2 - MEANO,"POLYGON ((11.15678 46.11661, 11.15687 46.11666..."
1,3,36949609,38485,BONDONE,Circoscrizione n. 3 - BONDONE,"POLYGON ((11.08026 46.11571, 11.08026 46.11571..."
2,4,8663138,16403,SARDAGNA,Circoscrizione n. 4 - SARDAGNA,"POLYGON ((11.09034 46.07917, 11.09032 46.07899..."
3,6,13199398,20575,ARGENTARIO,Circoscrizione n. 6 - ARGENTARIO,"POLYGON ((11.17163 46.08095, 11.17161 46.08106..."
4,11,3073349,10962,S.GIUSEPPE-S.CHIARA,Circoscrizione n. 11 - S.GIUSEPPE-S.CHIARA,"POLYGON ((11.11135 46.05878, 11.11137 46.05878..."
5,7,15433274,18464,POVO,Circoscrizione n. 7 - POVO,"POLYGON ((11.18467 46.02957, 11.18467 46.02957..."
6,5,16687779,27197,RAVINA-ROMAGNANO,Circoscrizione n. 5 - RAVINA-ROMAGNANO,"POLYGON ((11.11591 45.98873, 11.11597 45.98890..."
7,8,16409555,24413,MATTARELLO,Circoscrizione n. 8 - MATTARELLO,"POLYGON ((11.11591 45.98873, 11.11644 45.98845..."
8,9,7342864,15395,VILLAZZANO,Circoscrizione n. 9 - VILLAZZANO,"POLYGON ((11.15706 46.01669, 11.15723 46.01684..."
9,10,6962104,15418,OLTREFERSINA,Circoscrizione n. 10 - OLTREFERSINA,"POLYGON ((11.11723 46.04331, 11.11754 46.04306..."
