# Notebook to Gather Bronze Data 

# Step 0 - Notebook Setup

In [1]:
# import needed modules 
import os
import ee 
import xarray as xr 
import zarr 
import boto3
import easysnowdata 
from snowML.datapipe.utils import set_data_constants as sdc
from snowML.datapipe import get_bronze as gb
from snowML.datapipe.utils import get_geos as gg
from snowML.datapipe import bronze_to_gold as btg
from snowML.datapipe.to_silver import to_silver as silver
from snowML.datapipe.to_silver import combine_silver as cs 
from snowML.datapipe import to_model_ready as gtm
from snowML.datapipe.utils import data_utils as du

In [2]:
# Start the Earth Engine authentication flow, requesting the "notebook" auth mode.
# The call is left as the cell's final expression so its return value is displayed.
ee.Authenticate(auth_mode="notebook")

True

In [3]:
# Replace the project below with your own Earth Engine project name.
ee.Initialize(project="ee-frostydawgs")

In [7]:
# Select the AWS named profile for this kernel session by setting AWS_PROFILE.
# This overwrites any AWS_PROFILE value already present in the environment.
os.environ["AWS_PROFILE"] = "sue_private"

# Step 1 - Define S3 Buckets to Use 

In [5]:
# Build the bucket lookup used by the rest of the notebook and echo it as the
# cell output. In the recorded run the result maps keys such as "bronze" and
# "silver" to S3 bucket names.
# NOTE(review): the argument here is spelled "sue-private" (hyphen) while the
# AWS profile set earlier in this notebook is 'sue_private' (underscore) --
# confirm that both spellings are intended.
BUCKET_DICT = sdc.create_bucket_dict("sue-private")
BUCKET_DICT

{'shape-bronze': 'snowml2-shape',
 'bronze': 'snowml2-bronze',
 'silver': 'snowml2-silver',
 'gold': 'snowml2-gold',
 'model-ready': 'snowml2-model-ready'}

# Step 2 - Get the Data

In [8]:
# Destination bucket for all bronze downloads; reused by the later get_bronze cells.
bucket_nm = BUCKET_DICT["bronze"]

# Variable and year range for this download. yr_start is reused by later cells;
# yr_end is reassigned further down before the remaining variables are fetched.
var = "swe"
yr_start, yr_end = 1983, 2022

# Kept as the final expression so the returned store name is shown as the cell output.
gb.get_bronze(
    var,
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading https://daacdata.apps.nsidc.org/pub/DATASETS/nsidc0719_SWE_Snow_Depth_v1/4km_SWE_Depth_WY1983_v01.nc
<xarray.Dataset> Size: 3GB
Dimensions:   (lat: 621, lon: 1405, time: 365, time_str_len: 11)
Coordinates:
  * lat       (lat) float32 2kB 24.08 24.12 24.17 24.21 ... 49.83 49.88 49.92
  * lon       (lon) float32 6kB -125.0 -125.0 -124.9 ... -66.58 -66.54 -66.5
  * time      (time) datetime64[ns] 3kB 1982-10-01 1982-10-02 ... 1983-09-30
Dimensions without coordinates: time_str_len
Data variables:
    crs       |S1 1B ...
    time_str  (time_str_len, time) |S1 4kB dask.array<chunksize=(11, 365), meta=np.ndarray>
    SWE       (time, lat, lon) float32 1GB dask.array<chunksize=(61, 104, 235), meta=np.ndarray>
    DEPTH     (time, lat, lon) float32 1GB dask.array<chunksize=(61, 104, 235), meta=np.ndarray>
Created new Zarr file at s3://snowml2-bronze/swe_all.zarr
Processing year: 1984
Downloading https://daacdata.apps.nsidc.or

'swe_all.zarr'

In [10]:
# Short names of the variables fetched below, one get_bronze call per entry.
var_list_wrf = [
    "pr",
    "tmmn",
    "tmmx",
    "vs",
    "srad",
    "rmax",
    "rmin",
]

# End year for the downloads that follow (the earlier "swe" download used 2022).
yr_end = 2024

In [11]:
# Fetch var_list_wrf[0] ("pr") into the bronze bucket.
# The recorded run of this cell returned 'pr_all.zarr'.
gb.get_bronze(
    var_list_wrf[0],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/pr_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:               (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon                   (lon) float64 11kB -124.8 -124.7 ... -67.1 -67.06
  * lat                   (lat) float64 5kB 49.4 49.36 49.32 ... 25.11 25.07
  * day                   (day) datetime64[ns] 3kB 1983-01-01 ... 1983-12-31
  * crs                   (crs) uint16 2B 3
Data variables:
    precipitation_amount  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...


'pr_all.zarr'

In [12]:
# Fetch var_list_wrf[1] ("tmmn") into the bronze bucket.
# The recorded run of this cell returned 'tmmn_all.zarr'.
gb.get_bronze(
    var_list_wrf[1],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/tmmn_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:          (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon              (lon) float64 11kB -124.8 -124.7 -124.7 ... -67.1 -67.06
  * lat              (lat) float64 5kB 49.4 49.36 49.32 ... 25.15 25.11 25.07
  * day              (day) datetime64[ns] 3kB 1983-01-01 ... 1983-12-31
  * crs              (crs) uint16 2B 3
Data variables:
    air_temperature  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...
    date:      

'tmmn_all.zarr'

In [14]:
# Fetch var_list_wrf[2] ("tmmx") into the bronze bucket.
# The recorded run of this cell returned 'tmmx_all.zarr'.
gb.get_bronze(
    var_list_wrf[2],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/tmmx_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:          (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon              (lon) float64 11kB -124.8 -124.7 -124.7 ... -67.1 -67.06
  * lat              (lat) float64 5kB 49.4 49.36 49.32 ... 25.15 25.11 25.07
  * day              (day) datetime64[ns] 3kB 1983-01-01 ... 1983-12-31
  * crs              (crs) uint16 2B 3
Data variables:
    air_temperature  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...
    date:      

'tmmx_all.zarr'

In [15]:
# Fetch var_list_wrf[3] ("vs") into the bronze bucket.
# The recorded run of this cell returned 'vs_all.zarr'.
gb.get_bronze(
    var_list_wrf[3],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/vs_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:     (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon         (lon) float64 11kB -124.8 -124.7 -124.7 ... -67.14 -67.1 -67.06
  * lat         (lat) float64 5kB 49.4 49.36 49.32 49.28 ... 25.15 25.11 25.07
  * day         (day) datetime64[ns] 3kB 1983-01-01 1983-01-02 ... 1983-12-31
  * crs         (crs) uint16 2B 3
Data variables:
    wind_speed  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...
    date:              

'vs_all.zarr'

In [16]:
# Fetch var_list_wrf[4] ("srad") into the bronze bucket.
# The recorded run of this cell returned 'srad_all.zarr'.
gb.get_bronze(
    var_list_wrf[4],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/srad_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:                                    (lon: 1386, lat: 585, day: 365,
                                                crs: 1)
Coordinates:
  * lon                                        (lon) float64 11kB -124.8 ... ...
  * lat                                        (lat) float64 5kB 49.4 ... 25.07
  * day                                        (day) datetime64[ns] 3kB 1983-...
  * crs                                        (crs) uint16 2B 3
Data variables:
    surface_downwelling_shortwave_flux_in_air  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospati

'srad_all.zarr'

In [17]:
# Fetch var_list_wrf[5] ("rmax") into the bronze bucket.
# The recorded run of this cell returned 'rmax_all.zarr'.
gb.get_bronze(
    var_list_wrf[5],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/rmax_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:            (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon                (lon) float64 11kB -124.8 -124.7 -124.7 ... -67.1 -67.06
  * lat                (lat) float64 5kB 49.4 49.36 49.32 ... 25.15 25.11 25.07
  * day                (day) datetime64[ns] 3kB 1983-01-01 ... 1983-12-31
  * crs                (crs) uint16 2B 3
Data variables:
    relative_humidity  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...
   

'rmax_all.zarr'

In [18]:
# Fetch var_list_wrf[6] ("rmin") into the bronze bucket.
# The recorded run of this cell returned 'rmin_all.zarr'.
gb.get_bronze(
    var_list_wrf[6],
    bucket_nm,
    year_start=yr_start,
    year_end=yr_end,
)

Resuming with completed years: []
Processing year: 1983
Downloading http://www.northwestknowledge.net/metdata/data/rmin_1983.nc
<xarray.Dataset> Size: 2GB
Dimensions:            (lon: 1386, lat: 585, day: 365, crs: 1)
Coordinates:
  * lon                (lon) float64 11kB -124.8 -124.7 -124.7 ... -67.1 -67.06
  * lat                (lat) float64 5kB 49.4 49.36 49.32 ... 25.15 25.11 25.07
  * day                (day) datetime64[ns] 3kB 1983-01-01 ... 1983-12-31
  * crs                (crs) uint16 2B 3
Data variables:
    relative_humidity  (day, lat, lon) float64 2GB dask.array<chunksize=(365, 98, 231), meta=np.ndarray>
Attributes: (12/19)
    geospatial_bounds_crs:      EPSG:4326
    Conventions:                CF-1.6
    geospatial_bounds:          POLYGON((-124.7666666333333 49.40000000000000...
    geospatial_lat_min:         25.066666666666666
    geospatial_lat_max:         49.40000000000000
    geospatial_lon_min:         -124.7666666333333
    ...                         ...
   

'rmin_all.zarr'