# Check data structures and attributes for all dataset files

In [None]:
import os
import glob
import xarray as xr
import geopandas as gpd
import pandas as pd
import json
from tqdm import tqdm

In [None]:
# Define path to dataset
# The literal below is a machine-specific default. Set the
# SNOW_COVER_DATASET_PATH environment variable to point the notebook at a copy
# of the dataset stored elsewhere without editing this cell; an unset or empty
# variable falls back to the default.
data_path = (
    os.environ.get('SNOW_COVER_DATASET_PATH')
    or '/Volumes/LaCie/raineyaberle/Research/PhD/snow_cover_mapping/dataset'
)

In [None]:
### AOIs
# Read the AOIs GeoPackage stored in the dataset's analysis folder.
aois_fn = os.path.join(data_path, 'analysis', 'AOIs.gpkg')
aois = gpd.read_file(aois_fn)

# Print the min/max of the 'CenLon' and 'CenLat' columns as a quick sanity
# check on the coordinate ranges.
cen_lon = aois['CenLon']
print('Longitude range:', cen_lon.min(), cen_lon.max())
cen_lat = aois['CenLat']
print('Latitude range:', cen_lat.min(), cen_lat.max())

# Bare name as the last statement so the notebook renders the table.
aois

## Analyses

In [None]:
## Climate clusters
# Read climate_clusters.csv from the dataset's analysis folder into a DataFrame.
clusters_fn = os.path.join(data_path, 'analysis', 'climate_clusters.csv')
clusters = pd.read_csv(clusters_fn)
# Bare name as the last statement so the notebook renders the table for inspection.
clusters

In [None]:
## Median snow cover stats
# Open median_snow_cover_stats_MC.nc from the dataset's analysis folder with xarray.
# NOTE(review): the meaning of the "MC" suffix is not documented in this notebook — TODO confirm and describe.
scs_mc_fn = os.path.join(data_path, 'analysis', 'median_snow_cover_stats_MC.nc')
scs_mc = xr.open_dataset(scs_mc_fn)
# Bare name as the last statement so the notebook renders the dataset summary.
scs_mc

In [None]:
## Melt season timing
# Read melt_season_timing.csv from the dataset's analysis folder into a DataFrame.
ms_timing_fn = os.path.join(data_path, 'analysis', 'melt_season_timing.csv')
ms_timing = pd.read_csv(ms_timing_fn)
# Bare name as the last statement so the notebook renders the table for inspection.
ms_timing

In [None]:
## Minimum snow cover stats
# Read minimum_snow_cover_stats.csv from the dataset's analysis folder into a DataFrame.
min_scs_fn = os.path.join(data_path, 'analysis', 'minimum_snow_cover_stats.csv')
min_scs = pd.read_csv(min_scs_fn)
# Bare name as the last statement so the notebook renders the table for inspection.
min_scs

In [None]:
## Observed/modeled snowline/SMB comparison
# Read monthly_SLAs_annual_ELAs_observed_modeled.nc from the dataset's analysis folder.
slas_elas_fn = os.path.join(data_path, 'analysis', 'monthly_SLAs_annual_ELAs_observed_modeled.nc')
# This cell uses xr.load_dataset, whereas the other NetCDF cells in this
# notebook use xr.open_dataset. Per the xarray documentation, load_dataset
# reads the whole file into memory and closes it.
# NOTE(review): confirm the difference is intentional.
slas_elas = xr.load_dataset(slas_elas_fn)
# Bare name as the last statement so the notebook renders the dataset summary.
slas_elas

In [None]:
# PyGEM summary statistics
# Open PyGEM_comparison_summary.nc from the dataset's analysis folder with xarray.
# NOTE(review): the following cell opens this same file again as
# `pygem_summary`. One of the two cells looks redundant, or this one was meant
# to point at a different file — confirm before removing either, since other
# cells may use the `summary` name.
summary_fn = os.path.join(data_path, 'analysis', "PyGEM_comparison_summary.nc")
summary = xr.open_dataset(summary_fn)
# Bare name as the last statement so the notebook renders the dataset summary.
summary

In [None]:
# PyGEM summary
# Open PyGEM_comparison_summary.nc from the dataset's analysis folder with xarray.
# NOTE(review): the preceding cell already opens this same file as `summary`,
# so the file ends up opened twice under two names — confirm which cell should
# be kept.
pygem_summary_fn = os.path.join(data_path, 'analysis', 'PyGEM_comparison_summary.nc')
pygem_summary = xr.open_dataset(pygem_summary_fn)
# Bare name as the last statement so the notebook renders the dataset summary.
pygem_summary

## Classifications

In [None]:
# Classifications
rgi_ids = aois['RGIId'].drop_duplicates().values
rgi_id = rgi_ids[0]
classifications_fn = os.path.join(data_path, 'classifications', f"{rgi_id}_classifications.zarr")
ds = xr.open_zarr(classifications_fn)
ds