## Temperature Data Subset

In [22]:
import pandas as pd 
import seaborn as sns 

# Mapping from the raw CSV headers to the snake_case names used in the
# rest of the notebook. Headers not listed here are left unchanged.
data_colmap = {
    # location / scenario identifiers
    "long": "longitude",
    "lat": "latitude",
    "TimePeriod": "time_period",
    "RCP": "rep_con_path",
    # cover columns (renamed with a pct_ prefix)
    "treecanopy": "pct_treecanopy",
    "Ann_Herb": "pct_annual_herbcov",
    "Bare": "pct_bareground",
    "Herb": "pct_herbcov",
    "Litter": "pct_plantlittercov",
    "Shrub": "pct_shrubcov",
    # dry-soil, evaporation and frost metrics
    "DrySoilDays_Summer_whole": "drysoildays_summer",
    "Evap_Summer": "evap_summer",
    "ExtremeShortTermDryStress_Summer_whole": "xtr_st_drysoilstress_summer",
    "FrostDays_Winter": "frostdays_winter",
    "NonDrySWA_Summer_whole": "nondry_swa_summer",
    # precipitation (PPT_*)
    "PPT_Winter": "precipitation_winter",
    "PPT_Summer": "precipitation_summer",
    "PPT_Annual": "precipitation_annual",
    # temperature (T_*, Tmax_*, Tmin_*)
    "T_Winter": "temp_winter",
    "T_Summer": "temp_summer",
    "T_Annual": "temp_annual",
    "Tmax_Summer": "maxtemp_summer",
    "Tmin_Winter": "mintemp_winter",
    # VWC_* columns -> volwater_*
    "VWC_Winter_whole": "volwater_winter",
    "VWC_Spring_whole": "volwater_spring",
    "VWC_Summer_whole": "volwater_summer",
    "VWC_Fall_whole": "volwater_fall",
}

# Load the historic dataset with its original headers.
historic_data = pd.read_csv("../data/NABR_historic.csv")

# Raw header names (not displayed, since this is not the cell's last expression).
historic_data.columns

# Apply the mapping; rename returns a new frame, so rebind the name.
historic_data = historic_data.rename(columns=data_colmap)

In [23]:
# Temperature variables that get averaged per year in both datasets.
temp_value_cols = [
    "temp_winter",
    "temp_summer",
    "temp_annual",
    "maxtemp_summer",
    "mintemp_winter",
]

# --- historic data -------------------------------------------------------
# The historic subset also keeps the coordinates and winter frost days,
# although only the temperature variables are aggregated below.
temp_subset_cols = ["longitude", "latitude", "year", "frostdays_winter", *temp_value_cols]
temp_subset_hist = historic_data[temp_subset_cols]

# Mean of each temperature variable per year.
temp_data_agg = temp_subset_hist.groupby("year")[temp_value_cols].mean().reset_index()

# --- near-term data ------------------------------------------------------
# Load the near-term file and give it the same column names as historic_data.
recent_data = pd.read_csv("../data/nearterm_data_2020-2024.csv").rename(columns=data_colmap)

temp_subset_cols = ["year", "frostdays_winter", *temp_value_cols]
temp_subset_recent = recent_data[temp_subset_cols]

cleaned_recent_subset = temp_subset_recent.groupby("year")[temp_value_cols].mean().reset_index()

# --- combine and save ----------------------------------------------------
# Outer merge keyed on every column, so the yearly rows of both frames are kept.
cleaned_temp_subset = temp_data_agg.merge(
    cleaned_recent_subset,
    how="outer",
    on=["year", *temp_value_cols],
)
cleaned_temp_subset.to_csv("../data/cleaned_temp_subset.csv")

## Soil Data Subset

In [27]:
# Show the column labels of historic_data as a reference for the subsets below.
historic_data.columns

Index(['longitude', 'latitude', 'year', 'time_period', 'rep_con_path',
       'scenario', 'pct_treecanopy', 'pct_annual_herbcov', 'pct_bareground',
       'pct_herbcov', 'pct_plantlittercov', 'pct_shrubcov',
       'drysoildays_summer', 'evap_summer', 'xtr_st_drysoilstress_summer',
       'frostdays_winter', 'nondry_swa_summer', 'precipitation_winter',
       'precipitation_summer', 'precipitation_annual', 'temp_winter',
       'temp_summer', 'temp_annual', 'maxtemp_summer', 'mintemp_winter',
       'volwater_winter', 'volwater_spring', 'volwater_summer',
       'volwater_fall'],
      dtype='object')

In [29]:
# Columns selected from both datasets for the soil subset.
soil_data_cols = [
    "year",
    "drysoildays_summer",
    "evap_summer",
    "xtr_st_drysoilstress_summer",
    "nondry_swa_summer",
    "frostdays_winter",
]

# Variables averaged per year (this order fixes the column order of the
# aggregated frames).
soil_metric_cols = [
    "drysoildays_summer",
    "evap_summer",
    "xtr_st_drysoilstress_summer",
    "frostdays_winter",
    "nondry_swa_summer",
]

# Join keys for combining the two aggregated frames: every column they share.
soil_merge_keys = [
    "year",
    "drysoildays_summer",
    "evap_summer",
    "frostdays_winter",
    "xtr_st_drysoilstress_summer",
    "nondry_swa_summer",
]

soil_data_hist = historic_data[soil_data_cols]
soil_data_recent = recent_data[soil_data_cols]

# Yearly means for each source.
soil_data_hist_agg = soil_data_hist.groupby("year")[soil_metric_cols].mean().reset_index()
soil_data_recent_agg = soil_data_recent.groupby("year")[soil_metric_cols].mean().reset_index()

# Outer merge keeps the yearly rows from both sources.
soil_data_agg = soil_data_hist_agg.merge(
    soil_data_recent_agg,
    how="outer",
    on=soil_merge_keys,
)

soil_data_agg.to_csv("../data/soil_data.csv")

## Coverage Data Subset

In [25]:
# The six cover columns shared by every selection in this cell.
coverage_value_cols = [
    "pct_treecanopy",
    "pct_annual_herbcov",
    "pct_bareground",
    "pct_herbcov",
    "pct_plantlittercov",
    "pct_shrubcov",
]

# Column sets: yearly-aggregate view vs. per-location ("reg") view.
coverage_cols_agg = ["year", *coverage_value_cols]
coverage_cols_reg = ["latitude", "longitude", "year", *coverage_value_cols]

# Row-level selections from each dataset.
coverage_data_hist = historic_data[coverage_cols_agg]
coverage_data_recent = recent_data[coverage_cols_agg]
coverage_data_nonagg_hist = historic_data[coverage_cols_reg]
coverage_data_nonagg_recent = recent_data[coverage_cols_reg]

# Mean of each cover column per year.
coverage_data_agg_hist = coverage_data_hist.groupby("year")[coverage_value_cols].mean().reset_index()
coverage_data_agg_recent = coverage_data_recent.groupby("year")[coverage_value_cols].mean().reset_index()

# Combine the yearly means of both sources (outer merge on all columns).
coverage_data_agg = coverage_data_agg_hist.merge(
    coverage_data_agg_recent,
    how="outer",
    on=coverage_cols_agg,
)
coverage_data_agg.to_csv("../data/coverage_data_agg.csv")

# Combine the non-aggregated rows of both sources the same way.
coverage_data_nonagg = coverage_data_nonagg_hist.merge(
    coverage_data_nonagg_recent,
    how="outer",
    on=coverage_cols_reg,
)
coverage_data_nonagg.to_csv("../data/coverage_data_reg.csv")


## Rain Data Subset

In [26]:
# Precipitation and volwater_* columns shared by every selection in this cell.
rain_value_cols = [
    "precipitation_winter",
    "precipitation_summer",
    "precipitation_annual",
    "volwater_winter",
    "volwater_spring",
    "volwater_summer",
    "volwater_fall",
]

# Column sets: yearly-aggregate view vs. per-location ("reg") view.
rain_cols_agg = ["year", *rain_value_cols]
rain_cols_reg = ["year", "latitude", "longitude", *rain_value_cols]

# Per-location rows from each dataset.
rain_hist_reg = historic_data[rain_cols_reg]
rain_recent_reg = recent_data[rain_cols_reg]

# Yearly means of the rain columns for each dataset.
rain_hist_agg = (
    historic_data[rain_cols_agg]
    .groupby("year")[rain_value_cols]
    .mean()
    .reset_index()
)
rain_recent_agg = (
    recent_data[rain_cols_agg]
    .groupby("year")[rain_value_cols]
    .mean()
    .reset_index()
)

# Combine the yearly means of both sources (outer merge on all columns).
rain_data_agg = rain_hist_agg.merge(rain_recent_agg, how="outer", on=rain_cols_agg)
rain_data_agg.to_csv("../data/rain_data_agg.csv")

# Combine the per-location rows of both sources the same way.
rain_data_reg = rain_hist_reg.merge(rain_recent_reg, how="outer", on=rain_cols_reg)
rain_data_reg.to_csv("../data/rain_data_reg.csv")