# Notebook Setup

In [1]:
if 'google.colab' in str(get_ipython()):
  IN_COLLAB = True
else:
  IN_COLLAB = False

#TODO: CHANGE THIS BASED ON YOUR OWN LOCAL SETTINGS
MY_HOME_ABS_PATH = "/content/drive/MyDrive/W210/co2-flux-hourly-gpp-modeling"

if IN_COLLAB:
  from google.colab import drive
  drive.mount('/content/drive/')

Drive already mounted at /content/drive/; to attempt to forcibly remount, call drive.mount("/content/drive/", force_remount=True).


## Import Modules

In [2]:
# install required modules quietly
required_packages = ['geopandas', 'pyspark', 'azure-storage-blob']

for p in required_packages: 
  try:
      __import__(p)
  except ImportError:
      %pip install {p} --quiet

In [3]:
import os
os.environ["PYARROW_IGNORE_TIMEZONE"] = "1"
import math
import json

from pyspark.sql.functions import col
import pyspark.pandas as pd
from calendar import monthrange
from datetime import datetime
from io import BytesIO

import matplotlib.pyplot as plt
import plotly.express as px
import plotly.graph_objects as go

# Load locale custome modules
import sys
if IN_COLLAB:
  os.chdir(MY_HOME_ABS_PATH)
  sys.path.insert(0,os.path.abspath("./code/src/tools"))
else:
  sys.path.append(os.path.abspath("./code/src/tools"))

from CloudIO.AzStorageClient import AzStorageClient
from data_pipeline_lib import *

pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', None)
pd.set_option('display.float_format', lambda x: '%.5f' % x)

In [4]:
# Import SparkSession
from pyspark.sql import SparkSession
# Create a Spark Session
spark = SparkSession.builder.master("local[*]").config(
    "spark.jars.packages", 
    "org.apache.hadoop:hadoop-azure:3.3.1,com.microsoft.azure:azure-storage:8.6.6"
    ).getOrCreate()
# Check Spark Session Information
spark

# Constant Definitions

In [5]:
root_dir =  MY_HOME_ABS_PATH
tmp_dir =  root_dir + os.sep + '.tmp'
raw_data_dir = tmp_dir
data_dir = root_dir + os.sep + 'data'
cred_dir = root_dir + os.sep + '.cred'
az_cred_file = cred_dir + os.sep + 'azblobcred.json'

if IN_COLLAB:
  raw_data_dir = "/content/drive/MyDrive/CO2_flux_gpp_modeling/DS_capstone_23Spring_CO2/Data"

monthly_data_filename = raw_data_dir + os.sep + 'data_monthly_v1_0.csv'
interpolated_monthly_data_filename = data_dir + os.sep + "monthly-interpolated.csv"

# Load Monthly Data

Full features from the monthly data:
```
['SITE_ID', 'year', 'month', 'time', 'TIMESTAMP', 'dataset',
'LOCATION_LAT', 'LOCATION_LONG',
'TA_F', 'VPD_F', 'P_F', 'NETRAD',
'NEE_VUT_REF', 'NEE_VUT_REF_QC', 'NEE_CUT_REF', 'NEE_CUT_REF_QC', 'GPP_NT_VUT_REF', 'GPP_DT_VUT_REF', 'GPP_NT_CUT_REF', 'GPP_DT_CUT_REF', 'RECO_NT_VUT_REF', 'RECO_DT_VUT_REF', 'RECO_NT_CUT_REF', 'RECO_DT_CUT_REF',
'ET', 'BESS-PAR', 'BESS-PARdiff', 'BESS-RSDN', 'CSIF-SIFdaily', 'CSIF-SIFinst', 'PET', 'Ts', 'Tmean', 'prcp', 'vpd', 'prcp-lag3', 'ESACCI-sm', 'MODIS_LC', 'b1', 'b2', 'b3', 'b4', 'b5', 'b6', 'b7', 'EVI', 'GCI', 'NDVI', 'NDWI', 'NIRv', 'kNDVI',
'Percent_Snow', 'Fpar', 'Lai', 'LST_Day', 'LST_Night',
'SITE_IGBP', 'MODIS_IGBP','MODIS_PFT', 'koppen_sub', 'koppen', 'CO2_concentration']
```

In [6]:
included_features= ['SITE_ID', 'year', 'month', 'TIMESTAMP',
                   'ESACCI-sm',    # ESACCI Soil Moisture (%)
                   'Percent_Snow', # Percentage of snow cover (%)
                   'NDWI',      # Normalized Different Water Index (NDWI)
                   'PET',       # Potential ET (m)
                   'MODIS_PFT', # Plant Function Type
                   'MODIS_LC',  # MODIS Land Cover
                   'Ts',        # Skin temperature (K) ??
                   'LST_Day',   # Daytime land surface temperature (K)
                   'LST_Night', # Nightime land surface temperature (K)
                   'Lai',       # Leaf Area Index (LAI)
                   'Fpar',      # Fraction of photosynthetically active radiation (fPAR)
                   'CSIF-SIFdaily', # All-sky daily average SIF
                   'BESS-PAR',      # Photosynthetic Active Radiation (PAR) (W/m^2)
                   'BESS-PARdiff',  # Diffuse PAR (W/m^2)
                   'BESS-RSDN'      # Shortwave downwelling radiation (W/m^2)
                   ]
month_df = pd.read_csv(monthly_data_filename, usecols = included_features)

# only focus on target sites
month_df['date'] = pd.to_datetime(month_df['TIMESTAMP'],  format="%Y%m")
print(f"size:{month_df.shape}")
month_df.head()

size:(19015, 20)


Unnamed: 0,SITE_ID,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,MODIS_PFT,date
0,AR-SLu,2010,1,201001,154,40,336,0.20432,-0.01339,302.46967,0.15152,7,0.03542,0.0,0.49,1.2,313.84,293.58,SH,2010-01-01
1,AR-SLu,2010,2,201002,120,46,258,0.14553,-0.00894,298.78864,0.16656,7,0.0004,0.0,0.43,0.9,309.86,292.96,SH,2010-02-01
2,AR-SLu,2010,3,201003,107,31,231,0.1098,-0.00813,297.54816,0.16408,7,-0.02286,0.0,0.41,0.8,309.18,290.52,SH,2010-03-01
3,AR-SLu,2010,4,201004,81,27,175,0.07673,-0.00676,291.69604,0.12402,7,-0.04202,0.0,0.36,0.5,303.24,286.34,SH,2010-04-01
4,AR-SLu,2010,5,201005,56,19,122,0.06602,-0.00473,287.05652,0.14273,7,-0.01064,0.0,0.37,0.5,296.2,277.82,SH,2010-05-01


In [7]:
month_df[['date','TIMESTAMP']]

Unnamed: 0,date,TIMESTAMP
0,2010-01-01,201001
1,2010-02-01,201002
2,2010-03-01,201003
3,2010-04-01,201004
4,2010-05-01,201005
...,...,...
19010,2018-08-01,201808
19011,2018-09-01,201809
19012,2018-10-01,201810
19013,2018-11-01,201811


# Check NA

In [8]:
# Check_NA
month_df.isna().sum()

SITE_ID             0
year                0
month               0
TIMESTAMP           0
BESS-PAR            0
BESS-PARdiff        0
BESS-RSDN           0
CSIF-SIFdaily     121
PET               101
Ts                101
ESACCI-sm        1610
MODIS_LC            0
NDWI              406
Percent_Snow      143
Fpar              935
Lai               935
LST_Day             0
LST_Night           0
MODIS_PFT           0
date                0
dtype: int64

In [9]:
sites = month_df['SITE_ID'].unique()
sites

array(['AR-SLu', 'AR-Vir', 'AT-Neu', 'AU-ASM', 'AU-Ade', 'AU-Cpr',
       'AU-Cum', 'AU-DaP', 'AU-DaS', 'AU-Dry', 'AU-Emr', 'AU-Fog',
       'AU-Gin', 'AU-How', 'AU-RDF', 'AU-Rig', 'AU-Stp', 'AU-TTE',
       'AU-Tum', 'AU-Wac', 'AU-Whr', 'AU-Wom', 'AU-Ync', 'BR-Sa1',
       'BR-Sa3', 'CA-Man', 'CA-NS4', 'CA-NS7', 'CA-Oas', 'CA-Obs',
       'CA-SF1', 'CA-SF3', 'CA-TP1', 'CA-TP2', 'CA-TP3', 'CA-TPD',
       'CG-Tch', 'CH-Oe1', 'CN-Cha', 'CN-Cng', 'CN-Din', 'CN-Du2',
       'CN-Ha2', 'CN-HaM', 'CN-Qia', 'CN-Sw2', 'CZ-BK2', 'DE-Lkb',
       'DE-Lnf', 'DE-Seh', 'DE-SfN', 'DE-Spw', 'DK-Eng', 'ES-Amo',
       'ES-LgS', 'FI-Jok', 'FI-Lom', 'FI-Sod', 'FR-LBr', 'FR-Pue',
       'GH-Ank', 'GL-NuF', 'GL-ZaF', 'GL-ZaH', 'IT-CA1', 'IT-CA2',
       'IT-CA3', 'IT-Col', 'IT-Cpz', 'IT-La2', 'IT-Noe', 'IT-PT1',
       'IT-Ro1', 'IT-Ro2', 'IT-SRo', 'JP-MBF', 'JP-SMF', 'MY-PSO',
       'NL-Hor', 'PA-SPn', 'PA-SPs', 'RU-Che', 'RU-Cok', 'RU-Ha1',
       'SD-Dem', 'SJ-Adv', 'SN-Dhr', 'US-Atq', 'US-Blo', 'US-C

## Filln NAN's

In [10]:
pd.options.mode.chained_assignment = None
data_df = None
for i,s in enumerate(sites):
  site_df = month_df[month_df['SITE_ID'] == s]
  site_df = site_df.reset_index()
  site_df.set_index('date', inplace=True)

  if site_df.isna().sum().sum() != 0:
    pft = site_df['MODIS_PFT'][0]
    full_cols = site_df.columns[site_df.isna().sum() == 0]
    site_df = site_df.resample('M').mean()
    site_df[['year','month', 'TIMESTAMP']].interpolate(inplace=True)
    
    interpolate_fail = False
    try:
      site_df.interpolate(method='quadratic', limit_direction='backward', inplace=True)
    except:
      interpolate_fail = True
      #print(f"{s}:")
      #display(site_df)
    
    site_df.interpolate(method='linear', limit_direction='both', inplace=True)
    site_df = site_df.reset_index()
    site_df.set_index('date', inplace=True)
    site_df['SITE_ID'] = s
    site_df['MODIS_PFT'] = pft
  
  if site_df.isna().sum().sum() != 0:
    print(f"{s}:")
    display(site_df)

  site_df.drop("index", axis=1, inplace=True)

  if type(data_df) == type(None):
    data_df = site_df
  else:
    data_df = pd.concat([data_df, site_df])

pd.options.mode.chained_assignment = 'warn'

CA-TP3:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2003-05-31,1661.0,2003.0,5.0,200305.0,92.0,45.0,199.0,0.16003,-0.00319,288.54004,,12.0,0.04038,0.0,0.47,1.2,292.14,279.46,CA-TP3,CRO
2003-06-30,1660.98258,2003.18689,3.73957,200322.42835,72.27746,37.07305,156.74336,0.0671,-0.00171,279.80723,,12.0,-0.02729,15.33778,0.34694,0.62672,284.55783,272.55655,CA-TP3,CRO
2003-07-31,1660.99112,2003.35971,2.68094,200338.65232,55.4036,30.36063,120.55444,-0.01023,-0.00045,272.39225,,12.0,-0.0831,28.4625,0.24302,0.14995,278.12447,266.71675,CA-TP3,CRO
2003-08-31,1661.02663,2003.51192,1.87013,200353.06167,42.09331,25.15123,91.96437,-0.06855,0.00053,266.61256,,12.0,-0.12458,38.81821,0.16273,-0.2093,273.11564,262.19194,CA-TP3,CRO
2003-09-30,1661.08668,2003.63957,1.32142,200365.27847,32.60539,21.54095,71.53167,-0.1069,0.00122,262.57633,,12.0,-0.15106,46.20342,0.10753,-0.44507,269.62471,259.06513,CA-TP3,CRO
2003-10-31,1661.17527,2003.75119,0.99823,200376.11716,26.30731,19.28909,57.89415,-0.12784,0.00166,260.01448,,12.0,-0.16432,51.11047,0.07374,-0.57308,267.41896,257.12786,CA-TP3,CRO
2003-11-30,1661.28668,2003.83957,0.92142,200384.87847,23.60539,18.54095,51.93167,-0.13001,0.00182,259.09228,,12.0,-0.1635,53.22278,0.06353,-0.58507,266.64071,256.50513,CA-TP3,CRO
2003-12-31,1661.42835,2003.91061,1.08586,200392.14649,24.31951,19.24664,53.24671,-0.11355,0.00172,259.74826,,12.0,-0.14855,52.68116,0.07623,-0.48184,267.23806,257.15541,CA-TP3,CRO
2004-01-31,1661.59698,2003.96102,1.49811,200397.59991,28.59721,21.45534,62.1606,-0.07809,0.00134,262.03953,,12.0,-0.11925,49.37055,0.11256,-0.26109,269.25993,259.12067,CA-TP3,CRO
2004-02-29,1661.77916,2003.98951,2.10811,200401.05872,35.82506,24.88224,77.37868,-0.02772,0.00074,265.66342,,12.0,-0.07886,43.76673,0.16794,0.0518,272.44099,262.14961,CA-TP3,CRO


CG-Tch:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2006-07-31,1788.0,2006.0,7.0,200607.0,60.0,40.0,129.0,0.03219,-0.0042,296.46918,0.16134,9.0,,0.0,0.19,0.5,307.58,289.8,CG-Tch,SA
2006-08-31,1789.0,2006.0,8.0,200608.0,57.0,39.0,122.0,0.0,-0.00425,296.37665,0.17328,9.0,,0.0,0.16,0.4,310.36,290.1,CG-Tch,SA
2006-09-30,1790.0,2006.0,9.0,200609.0,58.0,46.0,115.0,0.0,-0.00432,297.62463,0.23372,9.0,,0.0,0.15,0.4,315.78,290.98,CG-Tch,SA
2006-10-31,1791.0,2006.0,10.0,200610.0,60.0,47.0,114.0,0.02433,-0.00522,299.12616,0.28374,9.0,,0.0,0.21,0.5,305.02,293.06,CG-Tch,SA
2006-11-30,1792.0,2006.0,11.0,200611.0,87.0,54.0,168.0,0.1681,-0.00427,298.8112,0.25753,9.0,,0.0,0.43,1.3,306.76,293.6,CG-Tch,SA
2006-12-31,1793.0,2006.0,12.0,200612.0,82.0,52.0,163.0,0.23642,-0.004,298.67575,0.27133,9.0,,0.0,0.53,1.7,301.14,295.3,CG-Tch,SA
2007-01-31,1793.64278,2006.0605,12.27972,200618.32924,74.12018,48.32427,152.25139,0.26271,-0.00396,298.4565,0.28009,9.0,,0.0,0.56524,1.84537,296.23787,296.25233,CG-Tch,SA
2007-02-28,1793.87054,2006.17608,11.8138,200629.42158,70.64176,45.15942,149.07437,0.26177,-0.00397,298.08646,0.27355,9.0,,0.0,0.5588,1.81616,294.29362,296.10819,CG-Tch,SA
2007-03-31,1793.73208,2006.37152,10.50241,200647.65396,70.81937,41.82727,152.78814,0.23342,-0.00404,297.48633,0.25032,9.0,,0.0,0.5093,1.60609,294.89061,294.83669,CG-Tch,SA
2007-04-30,1793.29097,2006.61369,8.6079,200669.97707,74.15636,38.90591,161.76467,0.182,-0.00414,296.76831,0.21472,9.0,,0.0,0.42402,1.25,297.91342,292.6921,CG-Tch,SA


GL-ZaF:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2009-09-30,2989.0,2009.0,9.0,200909.0,28.0,14.0,61.0,0.01663,2e-05,257.92456,,10.0,-0.13542,38.86666,0.21,0.3,272.08,264.14,GL-ZaF,GRA
2009-10-31,2988.26572,2009.16127,8.10123,200924.22778,42.25899,21.78404,89.99848,0.05454,0.0,267.13747,,10.0,-0.12666,-22.23168,0.19908,0.28374,284.46164,272.67613,GL-ZaF,GRA
2009-11-30,2987.69991,2009.30384,7.3903,200937.77405,53.43275,27.91118,112.68106,0.08484,-1e-05,274.48296,,10.0,-0.11966,-70.91764,0.18953,0.26937,294.2612,279.47052,GL-ZaF,GRA
2009-12-31,2987.26487,2009.43722,6.81982,200950.54187,62.2662,32.7899,130.55989,0.10954,-2e-05,280.45073,,10.0,-0.11396,-110.43697,0.18074,0.25594,302.132,284.97615,GL-ZaF,GRA
2010-01-31,2986.98189,2009.55643,6.41618,200962.05956,68.34242,36.19214,142.78776,0.12754,-3e-05,284.76934,,10.0,-0.1098,-138.98991,0.17302,0.24396,307.7104,288.94168,GL-ZaF,GRA
2010-02-28,2986.857,2009.65193,6.19501,200971.38811,71.46071,37.99608,148.97515,0.13802,-3e-05,287.25252,,10.0,-0.10737,-155.35383,0.16699,0.23437,310.77858,291.19971,GL-ZaF,GRA
2010-03-31,2986.86344,2009.74418,6.1089,200980.52649,72.28928,38.58827,150.44794,0.14324,-3e-05,288.4324,,10.0,-0.10616,-163.03527,0.16133,0.22514,311.99403,292.2341,GL-ZaF,GRA
2010-04-30,2987.01447,2009.81995,6.18442,200988.17979,70.46586,37.75555,146.49275,0.1419,-3e-05,288.00398,,10.0,-0.10647,-160.02746,0.15689,0.21757,310.9876,291.76876,GL-ZaF,GRA
2010-05-31,2987.32015,2009.88432,6.4266,200994.85822,65.8689,35.44242,136.8459,0.13392,-3e-05,285.93872,,10.0,-0.10831,-146.12988,0.15337,0.21117,307.6922,289.77265,GL-ZaF,GRA
2010-06-30,2987.76076,2009.93311,6.81982,201000.13091,58.79497,31.79811,122.12975,0.1198,-3e-05,282.36985,,10.0,-0.11156,-122.23916,0.15098,0.20635,302.32044,286.37456,GL-ZaF,GRA


GL-ZaH:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2001-07-31,2994.0,2001.0,7.0,200107.0,91.0,49.0,197.0,0.11941,0.0,269.7281,,10.0,-0.03364,4.77419,0.3,0.5,285.06,277.26,GL-ZaH,GRA
2001-08-31,2995.0,2001.0,8.0,200108.0,60.0,27.0,130.0,0.09478,-1e-05,268.6928,,10.0,-0.09898,0.0,0.3,0.4,286.78,273.86,GL-ZaH,GRA
2001-09-30,2995.69188,2001.02826,8.63505,200111.46064,40.25344,12.72359,87.26742,0.07797,-2e-05,268.2853,,10.0,-0.1422,-3.45533,0.29925,0.32595,288.34815,271.76165,GL-ZaH,GRA
2001-10-31,2996.12178,2001.08665,8.94749,200117.61262,30.44388,5.219,65.95341,0.06787,-2e-05,268.47843,,10.0,-0.16618,-5.82216,0.2977,0.27292,289.86898,270.82505,GL-ZaH,GRA
2001-11-30,2996.26194,2001.17142,8.91717,200126.05905,31.2042,4.9704,67.43308,0.06512,-2e-05,269.25974,,10.0,-0.16939,-6.94779,0.29545,0.24433,291.24439,271.11064,GL-ZaH,GRA
2001-12-31,2996.12172,2001.28821,8.54205,200137.36302,42.58508,11.96122,91.80507,0.06955,-2e-05,270.6813,,10.0,-0.15203,-6.90725,0.29235,0.23827,292.56606,272.63745,GL-ZaH,GRA
2002-01-31,2995.69178,2001.43468,7.81751,200151.28521,64.73488,26.31856,139.39453,0.08137,-1e-05,272.72715,,10.0,-0.11366,-5.64329,0.28846,0.25608,293.78651,275.41615,GL-ZaH,GRA
2002-02-28,2995.11488,2001.58628,6.93578,200165.56343,91.73387,44.13376,197.45866,0.09706,-0.0,274.93283,,10.0,-0.06484,-3.63397,0.28449,0.28961,294.72349,278.72836,GL-ZaH,GRA
2002-03-31,2994.6977,2001.73136,6.22754,200179.36352,113.2583,58.65936,243.73691,0.11054,0.0,276.49863,,10.0,-0.02291,-1.75729,0.28107,0.32422,295.01997,281.33637,GL-ZaH,GRA
2002-04-30,2994.58262,2001.84212,5.89114,200190.1034,123.20924,65.87085,265.10425,0.11822,1e-05,276.93919,,10.0,0.00123,-0.49295,0.27897,0.35179,294.47877,282.49749,GL-ZaH,GRA


IT-Cpz:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2001-01-31,3220.0,2001.0,1.0,200101.0,29.0,14.0,62.0,0.11072,-0.00257,283.3021,,9.0,0.18479,0.0,0.59,1.2,285.16,278.6,IT-Cpz,SA
2001-02-28,3221.0,2001.0,2.0,200102.0,42.0,21.0,90.0,0.12287,-0.00342,282.60922,,9.0,0.16638,0.0,0.61,1.4,285.58,277.96,IT-Cpz,SA
2001-03-31,3221.51511,2000.99999,3.03537,200103.03441,73.65677,31.3118,161.5198,0.18602,-0.00465,283.36826,,9.0,0.18471,0.0,0.63623,1.86841,287.97986,278.02013,IT-Cpz,SA
2001-04-30,3222.0,2001.0,4.0,200104.0,104.0,42.0,230.0,0.25549,-0.00538,286.68094,,9.0,0.20585,0.0,0.64,2.2,292.48,280.88,IT-Cpz,SA
2001-05-31,3223.0,2001.0,5.0,200105.0,122.0,50.0,268.0,0.28817,-0.00558,292.86157,,9.0,0.19009,0.0,0.61,2.2,298.92,287.26,IT-Cpz,SA
2001-06-30,3224.0,2001.0,6.0,200106.0,147.0,46.0,316.0,0.25597,-0.00824,296.35724,,9.0,0.11861,0.0,0.62,2.6,303.08,289.02,IT-Cpz,SA
2001-07-31,3224.52935,2001.0021,6.99504,200107.20519,152.13025,41.25743,323.66057,0.21379,-0.00907,298.29078,,9.0,0.06323,0.0,0.63026,2.73269,305.71523,289.96338,IT-Cpz,SA
2001-08-31,3224.46856,2001.0067,7.93809,200108.60765,130.74246,38.12309,278.2876,0.17303,-0.00708,298.82423,,9.0,0.04027,0.0,0.6314,2.43997,306.85491,290.8769,IT-Cpz,SA
2001-09-30,3224.43154,2001.00786,8.88925,200109.67491,98.26195,34.00243,210.64353,0.13729,-0.00458,297.21552,,9.0,0.04119,0.0,0.62456,1.99213,304.9086,290.31952,IT-Cpz,SA
2001-10-31,3225.0,2001.0,10.0,200110.0,66.0,26.0,143.0,0.1065,-0.00349,292.56488,,9.0,0.0583,0.0,0.61,1.6,298.12,286.84,IT-Cpz,SA


IT-Noe:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2004-05-31,3300.0,2004.0,5.0,200405.0,116.0,47.0,254.0,0.14687,,,,17.0,0.19579,0.0,0.55,1.8,294.04,285.2,IT-Noe,Other
2004-06-30,3301.0,2004.0,6.0,200406.0,148.0,41.0,327.0,0.13286,,,,17.0,0.12694,0.0,0.58,2.1,302.76,289.94,IT-Noe,Other
2004-07-31,3302.0,2004.0,7.0,200407.0,144.0,41.0,318.0,0.10294,,,,17.0,0.08755,0.0,0.53,1.7,305.56,292.26,IT-Noe,Other
2004-08-31,3303.0,2004.0,8.0,200408.0,126.0,38.0,275.0,0.0757,,,,17.0,0.06115,0.0,0.51,1.6,305.04,293.58,IT-Noe,Other
2004-09-30,3304.0,2004.0,9.0,200409.0,92.0,38.0,199.0,0.06714,,,,17.0,0.08971,0.0,0.51,1.3,301.66,291.08,IT-Noe,Other
2004-10-31,3305.0,2004.0,10.0,200410.0,67.0,25.0,144.0,0.05535,,,,17.0,0.13705,0.0,0.51,1.1,296.7,290.36,IT-Noe,Other
2004-11-30,3305.45244,2004.2508,7.94446,200433.02428,47.44352,15.31193,101.79222,0.05149,,,,17.0,0.18392,0.0,0.52528,1.09661,292.30761,288.24251,IT-Noe,Other
2004-12-31,3305.45905,2004.74141,3.04496,200477.18586,31.83249,11.571,68.92866,0.05662,,,,17.0,0.22883,0.0,0.5575,1.26113,288.50744,284.16122,IT-Noe,Other
2005-01-31,3306.0,2005.0,1.0,200501.0,31.0,14.0,68.0,0.06293,,,,17.0,0.2508,0.0,0.59,1.4,285.66,280.36,IT-Noe,Other
2005-02-28,3307.0,2005.0,2.0,200502.0,45.0,21.0,99.0,0.07005,,,,17.0,0.24347,0.0,0.61,1.5,284.56,278.14,IT-Noe,Other


US-KS2:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2003-05-31,4566.0,2003.0,5.0,200305.0,128.0,55.0,275.0,0.31656,-0.00806,299.7295,,8.0,0.20265,0.0,0.69,3.4,304.82,294.86,US-KS2,SA
2003-06-30,4567.0,2003.0,6.0,200306.0,109.0,53.0,231.0,0.35113,-0.00735,300.12415,,8.0,0.18487,0.0,0.63,2.9,302.26,295.48,US-KS2,SA
2003-07-31,4567.46874,2003.00098,7.00972,200307.10821,100.81272,51.97147,210.72841,0.33742,-0.0067,300.38874,,8.0,0.1887,0.0,0.59488,2.60971,301.1437,295.45918,US-KS2,SA
2003-08-31,4567.51903,2003.00226,8.00434,200308.23069,101.5163,51.14776,210.54671,0.28133,-0.00625,300.38127,,8.0,0.21062,0.0,0.59005,2.53617,301.15988,294.81019,US-KS2,SA
2003-09-30,4568.0,2003.0,9.0,200309.0,96.0,46.0,200.0,0.22888,-0.00657,299.43878,,8.0,0.22516,0.0,0.63,2.6,300.0,293.82,US-KS2,SA
2003-10-31,4569.0,2003.0,10.0,200310.0,83.0,36.0,176.0,0.18593,-0.00745,297.60236,,8.0,0.23185,0.0,0.7,2.7,297.94,292.36,US-KS2,SA
2003-11-30,4570.0,2003.0,11.0,200311.0,71.0,26.0,152.0,0.16559,-0.00724,295.50998,,8.0,0.23908,0.0,0.7,2.4,297.78,289.34,US-KS2,SA
2003-12-31,4571.0,2003.0,12.0,200312.0,59.0,22.0,126.0,0.14871,-0.00718,290.4204,,8.0,0.22089,0.0,0.71,2.2,293.1,282.62,US-KS2,SA
2004-01-31,4572.0,2004.0,1.0,200401.0,66.0,24.0,143.0,0.14039,-0.00617,290.3492,,8.0,0.19538,0.0,0.66,2.0,293.3,282.32,US-KS2,SA
2004-02-29,4573.0,2004.0,2.0,200402.0,67.0,32.0,142.0,0.1478,-0.00583,291.01395,,8.0,0.16738,0.0,0.57,1.9,294.44,283.02,US-KS2,SA


CA-Ca3:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2001-10-31,6710.0,2001.0,10.0,200110.0,37.0,18.0,79.0,0.16624,-0.00601,279.852,,1.0,0.38775,0.0,0.79,2.7,282.28,276.84,CA-Ca3,ENF
2001-11-30,6711.0,2001.0,11.0,200111.0,18.0,10.0,40.0,0.10636,-0.00306,277.2843,,1.0,0.39524,12.43333,0.78,2.5,276.82,273.4,CA-Ca3,ENF
2001-12-31,6712.0,2001.0,12.0,200112.0,12.0,7.0,26.0,0.07395,-0.00173,273.24756,,1.0,0.52622,42.32258,0.56783,1.1877,271.28,270.02,CA-Ca3,ENF
2002-01-31,6713.0,2002.0,1.0,200201.0,16.0,9.0,36.0,0.10019,-0.00191,273.41846,,1.0,0.4798,20.48387,0.49,0.7,272.6,269.4,CA-Ca3,ENF
2002-02-28,6714.0,2002.0,2.0,200202.0,30.0,15.0,65.0,0.12846,-0.00413,273.65863,,1.0,0.37833,8.03571,0.73,2.1,276.08,270.7,CA-Ca3,ENF
2002-03-31,6715.0,2002.0,3.0,200203.0,48.0,29.0,103.0,0.15874,-0.00603,273.4982,,1.0,0.31376,0.0,0.72,2.2,271.46,267.94,CA-Ca3,ENF
2002-04-30,6716.0,2002.0,4.0,200204.0,81.0,35.0,178.0,0.19565,-0.0115,278.17673,,1.0,0.26475,0.0,0.73,2.5,282.4,274.86,CA-Ca3,ENF
2002-05-31,6717.0,2002.0,5.0,200205.0,89.0,48.0,193.0,0.2905,-0.0148,281.19952,,1.0,0.26674,0.0,0.81,3.7,285.6,277.48,CA-Ca3,ENF
2002-06-30,6718.0,2002.0,6.0,200206.0,119.0,50.0,262.0,0.43044,-0.02037,286.6667,,1.0,0.35604,0.0,0.77,3.4,291.48,283.32,CA-Ca3,ENF
2002-07-31,6719.0,2002.0,7.0,200207.0,120.0,45.0,261.0,0.44223,-0.02164,289.43497,,1.0,0.38986,0.0,0.81,3.7,293.08,285.6,CA-Ca3,ENF


CA-TP4:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2003-05-31,7306.0,2003.0,5.0,200305.0,91.0,44.0,196.0,0.18747,-0.00636,286.51074,,12.0,0.02623,0.0,0.44,1.1,295.5,279.24,CA-TP4,CRO
2003-06-30,7307.0,2003.0,6.0,200306.0,116.0,49.0,254.0,0.30129,-0.00883,292.83313,,12.0,0.1344,0.0,0.58,1.9,300.84,285.72,CA-TP4,CRO
2003-07-31,7308.0,2003.0,7.0,200307.0,103.0,49.0,221.0,0.36174,-0.00891,296.065,,12.0,0.17368,0.0,0.61,2.0,303.36,287.24,CA-TP4,CRO
2003-08-31,7309.0,2003.0,8.0,200308.0,96.0,48.0,207.0,0.35646,-0.00712,296.40552,,12.0,0.20007,0.0,0.66,2.4,300.64,288.44,CA-TP4,CRO
2003-09-30,7310.0,2003.0,9.0,200309.0,81.0,36.0,176.0,0.25144,-0.00747,291.5208,,12.0,0.17321,0.0,0.63,1.9,296.58,283.02,CA-TP4,CRO
2003-10-31,7311.0,2003.0,10.0,200310.0,47.0,23.0,103.0,0.13977,-0.00565,283.77228,,12.0,0.08808,0.0,0.51,1.0,289.56,280.64,CA-TP4,CRO
2003-11-30,7312.0,2003.0,11.0,200311.0,27.0,14.0,58.0,0.06687,-0.00381,279.88693,,12.0,6e-05,12.46667,0.35,0.5,282.22,272.16,CA-TP4,CRO
2003-12-31,7313.0,2003.0,12.0,200312.0,21.0,12.0,46.0,0.03949,-0.00341,273.92236,,12.0,-0.01953,49.83871,0.35,0.6,273.16,266.68,CA-TP4,CRO
2004-01-31,7314.0,2004.0,1.0,200401.0,27.0,15.0,58.0,0.00959,-0.00208,265.64413,,12.0,0.02648,88.90323,0.29,0.4,264.1,257.44,CA-TP4,CRO
2004-02-29,7315.0,2004.0,2.0,200402.0,48.0,25.0,104.0,-0.00402,-0.00167,268.22098,,12.0,0.68682,99.17242,0.22,0.3,270.0,261.04,CA-TP4,CRO


FI-Qvd:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2018-06-30,15503.0,2018.0,6.0,201806.0,116.0,46.0,252.0,,-0.02496,288.94205,0.30284,8.0,0.24048,0.0,0.67,2.2,295.8,281.4,FI-Qvd,SA
2018-07-31,15504.0,2018.0,7.0,201807.0,103.0,46.0,220.0,,-0.02019,294.27423,0.30384,8.0,0.26992,0.0,0.76,2.8,299.44,286.8,FI-Qvd,SA
2018-08-31,15505.0,2018.0,8.0,201808.0,80.0,38.0,174.0,,-0.01832,291.62878,0.3088,8.0,0.22941,0.0,0.69,2.2,294.48,285.5,FI-Qvd,SA
2018-09-30,15506.0,2018.0,9.0,201809.0,45.0,24.0,96.0,,-0.01388,286.92654,0.30124,8.0,0.23919,0.0,0.7,1.8,288.66,281.36,FI-Qvd,SA
2018-10-31,15507.0,2018.0,10.0,201810.0,22.0,11.0,47.0,,-0.00598,280.45117,0.32059,8.0,0.25041,0.0,0.6,1.2,280.9,276.64,FI-Qvd,SA
2018-11-30,15508.0,2018.0,11.0,201811.0,5.0,3.0,12.0,,-0.00359,276.95148,0.32379,8.0,0.24013,1.42857,0.50553,0.74879,276.0,271.64,FI-Qvd,SA
2018-12-31,15509.0,2018.0,12.0,201812.0,2.0,1.0,4.0,,-0.00263,272.14746,0.32882,8.0,0.19926,2.26878,0.43683,0.49026,267.08,266.5,FI-Qvd,SA
2019-01-31,15509.51844,2018.16686,11.01671,201827.70267,10.8358,3.77973,23.00561,,-0.00348,270.38456,0.34016,8.0,0.12654,2.05811,0.39755,0.44274,264.7208,264.22355,FI-Qvd,SA
2019-02-28,15509.50865,2018.48566,8.13768,201856.70398,28.266,10.13374,62.62244,,-0.00599,272.15645,0.35264,8.0,0.04447,1.12634,0.38966,0.53054,269.96514,265.03471,FI-Qvd,SA
2019-03-31,15509.48945,2018.84157,4.91528,201889.07277,52.20242,19.52194,116.66231,,-0.00953,275.92745,0.34773,8.0,0.00823,0.34682,0.41378,0.72146,279.1949,268.0811,FI-Qvd,SA


FR-FBn:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2008-02-29,15891.0,2008.0,2.0,200802.0,49.0,21.0,109.0,0.09429,-0.00254,281.2051,,1.0,0.16771,0.0,0.6,1.3,285.88,277.72,FR-FBn,ENF
2008-03-31,15892.0,2008.0,3.0,200803.0,79.0,30.0,177.0,0.11121,-0.00647,282.84027,,1.0,0.13327,0.0,0.54,1.3,287.28,278.64,FR-FBn,ENF
2008-04-30,15893.0,2008.0,4.0,200804.0,101.0,37.0,224.0,0.14959,-0.00632,285.4397,,1.0,0.1163,0.0,0.56,1.6,293.36,279.96,FR-FBn,ENF
2008-05-31,15894.0,2008.0,5.0,200805.0,105.0,48.0,232.0,0.19177,-0.00621,290.27386,,1.0,0.13655,0.0,0.53,1.6,295.68,284.34,FR-FBn,ENF
2008-06-30,15895.0,2008.0,6.0,200806.0,138.0,49.0,304.0,0.21484,-0.00804,294.40692,,1.0,0.1436,0.0,0.59,1.9,301.02,288.54,FR-FBn,ENF
2008-07-31,15896.0,2008.0,7.0,200807.0,144.0,41.0,317.0,0.19076,-0.0091,297.53937,,1.0,0.12292,0.0,0.57,1.7,304.52,290.42,FR-FBn,ENF
2008-08-31,15897.0,2008.0,8.0,200808.0,122.0,39.0,268.0,0.16225,-0.00835,297.66684,,1.0,0.11727,0.0,0.54,1.6,305.4,290.58,FR-FBn,ENF
2008-09-30,15898.0,2008.0,9.0,200809.0,74.0,34.0,162.0,0.13362,-0.00636,293.17603,,1.0,0.14065,0.0,0.54,1.3,297.68,286.8,FR-FBn,ENF
2008-10-31,15899.0,2008.0,10.0,200810.0,53.0,23.0,116.0,0.10877,-0.00409,289.0178,,1.0,0.17677,0.0,0.54,1.0,293.26,285.04,FR-FBn,ENF
2008-11-30,15900.0,2008.0,11.0,200811.0,32.0,15.0,71.0,0.09651,-0.00325,283.61383,,1.0,0.21426,0.0,0.6,1.3,285.46,278.98,FR-FBn,ENF


GF-Guy:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2015-01-31,16662.0,2015.0,1.0,201501.0,70.0,51.0,137.0,0.24654,-0.01791,297.8203,,2.0,0.26299,0.0,0.74,3.8,298.98,292.78,GF-Guy,EBF
2015-02-28,16663.0,2015.0,2.0,201502.0,85.0,57.0,167.0,0.34187,-0.02408,298.22382,,2.0,0.26299,0.0,0.82,4.9,299.1,293.1,GF-Guy,EBF
2015-03-31,16664.0,2015.0,3.0,201503.0,79.0,57.0,153.0,0.40645,-0.02521,298.3366,,2.0,0.26299,0.0,0.79,4.6,299.84,293.44,GF-Guy,EBF
2015-04-30,16665.0,2015.0,4.0,201504.0,89.0,58.0,177.0,0.3948,-0.02871,298.7116,,2.0,0.26299,0.0,0.75,3.9,300.6,290.26,GF-Guy,EBF
2015-05-31,16666.0,2015.0,5.0,201505.0,73.0,52.0,143.0,0.34743,-0.01804,298.25592,,2.0,0.26299,0.0,0.74,3.8,299.68,291.74,GF-Guy,EBF
2015-06-30,16667.0,2015.0,6.0,201506.0,99.0,52.0,198.0,0.34509,-0.01309,298.20258,,2.0,0.29803,0.0,0.8,4.7,299.08,293.82,GF-Guy,EBF
2015-07-31,16668.0,2015.0,7.0,201507.0,105.0,53.0,213.0,0.34722,-0.01564,298.73413,,2.0,0.31391,0.0,0.85,5.2,299.72,293.68,GF-Guy,EBF
2015-08-31,16669.0,2015.0,8.0,201508.0,114.0,50.0,235.0,0.38614,-0.01962,299.38684,,2.0,0.30912,0.0,0.86,5.6,301.18,294.02,GF-Guy,EBF
2015-09-30,16670.0,2015.0,9.0,201509.0,121.0,51.0,252.0,0.45057,-0.02886,300.35114,,2.0,0.3123,0.0,0.84,5.5,303.14,294.96,GF-Guy,EBF
2015-10-31,16670.52576,2015.0,10.02315,201510.02315,122.45494,49.84329,254.76274,0.4351,-0.02796,300.40063,,2.0,0.33487,0.0,0.85988,5.62541,303.00958,295.10241,GF-Guy,EBF


IT-Cp2:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2012-05-31,17019.0,2012.0,5.0,201205.0,127.0,42.0,280.0,0.28853,-0.00615,291.1674,,9.0,0.20719,0.0,0.65,2.5,299.52,283.88,IT-Cp2,SA
2012-06-30,17018.62515,2011.97662,6.24374,201203.90548,125.16682,41.21546,276.26348,0.2694,-0.00625,293.68548,,9.0,0.1626,-0.19205,0.72478,2.96602,303.45786,287.61386,IT-Cp2,SA
2012-07-31,17018.53039,2011.96444,7.39399,201203.8378,117.78103,38.99811,259.9481,0.24849,-0.00606,295.02073,,9.0,0.13901,-0.29208,0.77178,3.19871,305.17938,289.81393,IT-Cp2,SA
2012-08-31,17018.733,2011.96444,8.40706,201204.85087,104.81371,35.35105,230.97425,0.22641,-0.00557,295.06845,,9.0,0.13826,-0.29208,0.78799,3.17844,304.5148,290.32857,IT-Cp2,SA
2012-09-30,17019.21223,2011.97603,9.25685,201206.86029,86.95033,30.46036,190.88248,0.20394,-0.00482,293.88872,,9.0,0.1593,-0.19684,0.77436,2.918,301.59979,289.22186,IT-Cp2,SA
2012-10-31,17020.0,2012.0,10.0,201210.0,63.0,24.0,137.0,0.17958,-0.00375,291.4029,,9.0,0.20352,0.0,0.73,2.4,296.24,286.42,IT-Cp2,SA
2012-11-30,17021.0,2012.0,11.0,201211.0,38.0,17.0,81.0,0.15467,-0.00271,287.53882,,9.0,0.25318,0.2,0.67,1.8,289.38,281.74,IT-Cp2,SA
2012-12-31,17022.0,2012.0,12.0,201212.0,30.0,13.0,65.0,0.12789,-0.00287,281.92047,,9.0,0.23199,0.0,0.66,1.8,284.72,274.7,IT-Cp2,SA
2013-01-31,17023.0,2013.0,1.0,201301.0,32.0,14.0,70.0,0.11325,-0.00218,281.2712,,9.0,0.20616,0.0,0.66,1.6,284.76,275.46,IT-Cp2,SA
2013-02-28,17024.0,2013.0,2.0,201302.0,49.0,21.0,108.0,0.12469,-0.00309,280.6173,,9.0,0.17889,0.0,0.62,1.5,286.04,274.26,IT-Cp2,SA


DE-Hte:


Unnamed: 0_level_0,index,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night,SITE_ID,MODIS_PFT
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
2009-01-31,18679.0,2009.0,1.0,200901.0,10.0,6.0,21.0,,-0.00095,272.89047,0.31022,17.0,0.17859,13.80645,0.29,0.4,274.12,268.3,DE-Hte,Other
2009-02-28,18680.0,2009.0,2.0,200902.0,15.0,10.0,31.0,,-0.00117,273.56256,0.30168,17.0,0.12921,8.0,0.33,0.5,273.34,268.48,DE-Hte,Other
2009-03-31,18681.0,2009.0,3.0,200903.0,40.0,22.0,89.0,,-0.00257,277.50446,0.30312,17.0,0.0499,0.0,0.36,0.6,279.58,272.1,DE-Hte,Other
2009-04-30,18682.0,2009.0,4.0,200904.0,95.0,34.0,212.0,,-0.00561,283.94714,0.24812,17.0,0.07131,0.0,0.59,1.6,290.28,278.16,DE-Hte,Other
2009-05-31,18683.0,2009.0,5.0,200905.0,105.0,43.0,229.0,,-0.00659,286.09286,0.22195,17.0,0.24402,0.0,0.76,3.3,289.58,281.16,DE-Hte,Other
2009-06-30,18684.0,2009.0,6.0,200906.0,101.0,50.0,218.0,,-0.00705,287.8319,0.24192,17.0,0.33423,0.0,0.78,4.0,289.84,283.92,DE-Hte,Other
2009-07-31,18684.77801,2009.02561,6.72679,200909.28788,92.91714,55.34794,198.76421,,-0.00723,288.84006,0.26265,17.0,0.38471,0.03215,0.75594,4.26686,290.06439,285.79577,DE-Hte,Other
2009-08-31,18685.24482,2009.08162,7.08157,200915.24373,81.17444,58.69778,171.66553,,-0.00706,288.81109,0.27555,17.0,0.40504,0.05405,0.70513,4.20552,289.60937,286.41603,DE-Hte,Other
2009-09-30,18685.40026,2009.16477,7.0707,200923.54773,66.32588,60.03711,137.95446,,-0.00658,287.79556,0.28057,17.0,0.39601,0.06549,0.6305,3.83367,288.52214,285.82086,DE-Hte,Other
2009-10-31,18685.2547,2009.2806,6.69347,200934.75346,47.38157,59.45521,95.38362,,-0.00574,285.72577,0.27804,17.0,0.35702,0.06723,0.52706,3.12651,286.7302,283.97059,DE-Hte,Other


In [11]:
data_df.isna().sum()

SITE_ID             0
year                0
month               0
TIMESTAMP           0
BESS-PAR            0
BESS-PARdiff        0
BESS-RSDN           0
CSIF-SIFdaily     150
PET               125
Ts                125
ESACCI-sm        1144
MODIS_LC            0
NDWI               42
Percent_Snow        0
Fpar                0
Lai                 0
LST_Day             0
LST_Night           0
MODIS_PFT           0
dtype: int64

In [12]:
# Save interpolated monthly data checkpoint
data_df.to_csv(interpolated_monthly_data_filename);

# Feature EDA

In [13]:
month_df.describe()

Unnamed: 0,year,month,TIMESTAMP,BESS-PAR,BESS-PARdiff,BESS-RSDN,CSIF-SIFdaily,PET,Ts,ESACCI-sm,MODIS_LC,NDWI,Percent_Snow,Fpar,Lai,LST_Day,LST_Night
count,19015.0,19015.0,19015.0,19015.0,19015.0,19015.0,18894.0,18914.0,18914.0,17405.0,19015.0,18609.0,18872.0,18080.0,18080.0,19015.0,19015.0
mean,2010.62682,6.59085,201069.27294,79.33305,33.84565,157.84491,0.15174,-0.00731,283.59837,0.25658,7.97002,0.16576,11.62064,0.48448,1.43052,289.81701,277.19649
std,5.1509,3.38791,515.04368,59.94865,24.61444,87.69293,0.1402,0.00683,10.691,0.06502,3.77654,0.19989,26.68487,0.19973,1.12848,13.73765,9.70005
min,2001.0,1.0,200101.0,0.0,0.0,0.0,-0.0292,-0.05543,239.46857,1e-05,1.0,-0.2762,0.0,0.06,0.1,238.54,237.9
25%,2006.0,4.0,200612.0,39.0,18.0,81.0,0.04175,-0.00914,276.33478,0.21682,5.0,0.02816,0.0,0.33,0.5,280.38,271.24
50%,2011.0,7.0,201103.0,77.0,32.0,163.0,0.10285,-0.00554,284.15315,0.26504,9.0,0.1697,0.0,0.5,1.1,290.9,277.92
75%,2015.0,10.0,201502.0,106.0,45.0,225.0,0.23512,-0.00262,290.97623,0.30111,11.0,0.28347,1.17136,0.65,2.1,298.46,284.18
max,2020.0,12.0,202012.0,611.0,241.0,373.0,0.70735,4e-05,310.28552,0.42007,17.0,0.85476,100.0,0.91,6.3,328.28,299.34


In [14]:
# used data with all features
month_df = pd.read_csv(monthly_data_filename, usecols=['SITE_ID', 'SITE_IGBP', 'MODIS_IGBP', 'MODIS_LC'])
group_df = month_df.groupby('SITE_ID').first()
print(f"size:{group_df.shape}")
tmp_df = group_df[group_df['SITE_IGBP'] != group_df['MODIS_IGBP']][['SITE_IGBP', 'MODIS_IGBP', 'MODIS_LC']]
print(f"size:{tmp_df.shape}")
tmp_df

size:(243, 3)
size:(162, 3)


Unnamed: 0_level_0,SITE_IGBP,MODIS_IGBP,MODIS_LC
SITE_ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
AR-SLu,MF,OSH,7
AR-Vir,ENF,SAV,9
AT-Neu,GRA,MF,5
AU-ASM,SAV,CSH,6
AU-Ade,WSA,GRA,10
AU-Cpr,SAV,CSH,6
AU-Cum,EBF,SAV,9
AU-DaS,SAV,GRA,10
AU-Dry,SAV,GRA,10
AU-Fog,WET,GRA,10
