# User Input - Set Data Locations 

In [1]:
## Root directories (machine-specific absolute paths)
##   wd  : working directory on Google Drive
##   swd : project directory on Dropbox
wd = "/Users/meghs/Google Drive/My Drive/Science/model_utilities_data/"
swd = "/Users/meghs/Dropbox/Tropical_Forests_Data_Discovery/"

## Sub-folders built from the roots above
##   dd : AGB data folder (under wd)
##   sd : spatial data folder (under swd)
dd = f"{wd}AGB_Data/"
sd = f"{swd}Spatial_Data/"

## Import Modules

In [2]:
## General
import os
from datetime import date

## Earthshot Model Utilities
import modelUtilities 
from modelUtilities import GetFeatures as gf
from modelUtilities import SetupData

## Capture today's date once; year_now is the year rendered with "%Y"
today = date.today()
year_now = f"{today:%Y}"

## Set Location of all Spatial Data

In [None]:
## Input table: Poorter 2016 CSV, stored in the AGB data folder (dd)
poorter = f"{dd}Poorter_2016_Data.csv"

## Single-file spatial layers, all stored under the spatial data folder (sd)
cwd_layer = f"{sd}CWD/CWD.bil/CWD.bil"
biomass_layer = f"{sd}Forest_AGB.tif"
ecoreg_layer = f"{sd}Terrestrial_Ecoregions/Terrestrial_Ecoregions.shp"
bio04_layer = f"{sd}WorldClim/Bio/wc2.1_2.5m_bio_4.tif"
bio15_layer = f"{sd}WorldClim/Bio/wc2.1_2.5m_bio_15.tif"
cec_layer = f"{sd}T_CEC_CLAY.nc4"

## WorldClim folders (note the trailing slash: these are directories, not files)
ppt_folder = f"{sd}WorldClim/wc2.1_30s_prec/"
tmax_folder = f"{sd}WorldClim/wc2.1_30s_tmax/"

## Format Poorter Data

In [None]:
## Load and format the Poorter CSV through the project helper.
## NOTE(review): later cells treat `df` as a pandas-style DataFrame (column
## selection, drop_duplicates, merge) -- confirm against SetupData.Format_Poorter.
df = SetupData.Format_Poorter(poorter)


## Get List of unique site/lat/lon information from poorter data to pull points from

In [None]:
## One row per unique (site, latitude, longitude) combination, re-indexed from 0
Location_Info = (
    df[['Chronosequence', 'Latitude', 'Longitude']]
    .drop_duplicates()
    .reset_index(drop=True)
)


# Call Features from spatial data

## Precipitation

In [None]:
  ## Pull precipitation for every site in Location_Info from the WorldClim
  ## precipitation folder (presumably an annual value per site -- confirm in
  ## modelUtilities.GetFeatures.Get_AnnualPPT).
  ## NOTE(review): this cell is indented by two spaces. IPython strips a cell's
  ## leading indentation, but the same line in a plain .py script would raise
  ## IndentationError -- dedent when exporting.
  ppt = gf.Get_AnnualPPT(Location_DF = Location_Info, PPT_Folder = ppt_folder)

## BioClim Variables (function would work for any of them)

In [None]:
## Same extractor, two WorldClim BioClim rasters; BioName labels each result
bio04 = gf.Get_BioClim(
    Location_DF=Location_Info,
    Bio_Location=bio04_layer,
    BioName="Bio04",
)
bio15 = gf.Get_BioClim(
    Location_DF=Location_Info,
    Bio_Location=bio15_layer,
    BioName="Bio15",
)
  

## Climatic Water Deficit 

In [None]:
## Extract climatic water deficit for every site from the CWD raster
CWD = gf.Get_CWD(
    Location_DF=Location_Info,
    CWD_Location=cwd_layer,
)

## Biome/Ecoregion Information: currently disabled because of an error in the geopandas `sjoin` function

In [None]:
## TODO: re-enable once the geopandas sjoin error is resolved.
## NOTE(review): as written this call is not valid Python (positional arguments
## follow a keyword argument), and Bio_Location / BioName are not defined in
## this notebook -- confirm Get_Biome's signature before uncommenting.
#biome = gf.Get_Biome(Location_DF = Location_Info, Bio_Location, BioName)

## Maximum Temperature

In [None]:
## Extract maximum temperature for every site from the WorldClim tmax folder
tmax = gf.Get_MaxT(
    Location_DF=Location_Info,
    MaxT_Folder=tmax_folder,
)

## Cation Exchange Capacity (metric of soil fertility)

In [None]:
## Extract soil cation exchange capacity for every site from the CEC layer
cec = gf.Get_SoilCEC(
    Location_DF=Location_Info,
    SoilCEC_Location=cec_layer,
)

## Merge Back with original poorter data
Currently, columns are added to the dataset as they are extracted, so whichever feature is run last will contain all of the previously extracted data. This should probably be amended in future versions.

In [None]:
## Join the extracted site-level features back onto the full Poorter table.
## NOTE(review): assuming `df` is a pandas DataFrame, merge() with no `on=` /
## `how=` joins on every column name the two frames share, using an inner join
## -- presumably Chronosequence / Latitude / Longitude here; confirm that no
## other column names collide and that no rows are dropped.
## Only `cec` is merged, so this relies on `cec` carrying every previously
## extracted column, i.e. on the feature cells having been run in order.
final_df = df.merge(cec)

# Save newly built out data to CSV

In [None]:
## Write the merged table next to the input data, stamped with today's date
## (MM.DD.YYYY); the DataFrame index is not written to the file
out_filename = f"{dd}AGB_Data_{today:%m.%d.%Y}.csv"
final_df.to_csv(out_filename, index=False)

NB: Currently the data 