In [1]:
import matplotlib.pyplot as plt
import numpy as np
from numpy import ma
import xarray as xr
import geopandas as gpd
import pandas as pd
# requires cartopy to be installed
import cartopy.feature as cfeature
import cartopy.io.shapereader as shpreader

import cartopy.crs as ccrs # for projection
import cartopy.feature as cfeature # for map features
from cartopy.util import add_cyclic_point
from matplotlib.axes import Axes
from cartopy.mpl.geoaxes import GeoAxes
#from matplotlib.colors import TwoSlopeNorm
from cartopy.mpl.gridliner import LONGITUDE_FORMATTER, LATITUDE_FORMATTER
import xesmf as xe 
import sys
import os
import dask

In [2]:
# Climate models whose FWI files are processed below, one task per entry.
# The order is kept as originally written.
models = [
    "BNU-ESM",
    "CNRM-CM5",
    "CSIRO-Mk3-6-0",
    "CanESM2",
    "GFDL-ESM2G",
    "GFDL-ESM2M",
    "HadGEM2-CC365",
    "HadGEM2-ES365",
    "IPSL-CM5A-LR",
    "IPSL-CM5A-MR",
    "IPSL-CM5B-LR",
    "MIROC-ESM-CHEM",
    "MIROC-ESM",
    "MIROC5",
    "bcc-csm1-1-m",
    "MRI-CGCM3",
    "bcc-csm1-1",
    "inmcm4",
]

In [3]:
from dask_jobqueue import SLURMCluster

# Describe one SLURM job: 2 cores and 80GB shared by 2 worker processes,
# with a 4-hour wall-time limit.
# The scheduler listens on the host:port below; change the last 4 digits
# (the port) to some other value between 7000-8000 if it is already taken.
cluster = SLURMCluster(
    cores=2,
    processes=2,
    memory="80GB",
    walltime="04:00:00",
    scheduler_options=dict(host='172.22.179.3:7663'),
)

# Request 18 workers in total.
cluster.scale(18)

In [4]:
from dask.distributed import Client

# Connect this notebook session to the SLURM-backed cluster defined above.
client = Client(cluster)

# Bare last expression so the notebook renders the client/cluster summary.
client

0,1
Connection method: Cluster object,Cluster type: dask_jobqueue.SLURMCluster
Dashboard: /proxy/8787/status,

0,1
Dashboard: /proxy/8787/status,Workers: 16
Total threads: 16,Total memory: 596.00 GiB

0,1
Comm: tcp://172.22.179.3:7663,Workers: 16
Dashboard: /proxy/8787/status,Total threads: 16
Started: Just now,Total memory: 596.00 GiB

0,1
Comm: tcp://172.22.178.61:33456,Total threads: 1
Dashboard: /proxy/45928/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.61:36875,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-t64use6r,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-t64use6r

0,1
Comm: tcp://172.22.178.61:34698,Total threads: 1
Dashboard: /proxy/45439/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.61:36852,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-i1vkryy4,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-i1vkryy4

0,1
Comm: tcp://172.22.178.81:41203,Total threads: 1
Dashboard: /proxy/44870/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.81:34087,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-vf1d4bhn,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-vf1d4bhn

0,1
Comm: tcp://172.22.178.81:33165,Total threads: 1
Dashboard: /proxy/35822/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.81:36013,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-2yczthr3,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-2yczthr3

0,1
Comm: tcp://172.22.178.80:36945,Total threads: 1
Dashboard: /proxy/36392/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.80:36532,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-487r7wfb,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-487r7wfb

0,1
Comm: tcp://172.22.178.80:41183,Total threads: 1
Dashboard: /proxy/43553/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.80:45578,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-ze4gxch_,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-ze4gxch_

0,1
Comm: tcp://172.22.178.82:39534,Total threads: 1
Dashboard: /proxy/43323/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.82:41779,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-wbjyzfa_,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-wbjyzfa_

0,1
Comm: tcp://172.22.178.82:39780,Total threads: 1
Dashboard: /proxy/42269/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.82:36862,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-bwq73gsn,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-bwq73gsn

0,1
Comm: tcp://172.22.178.102:33985,Total threads: 1
Dashboard: /proxy/44200/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.102:44168,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-dxjhlxdo,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-dxjhlxdo

0,1
Comm: tcp://172.22.178.102:46156,Total threads: 1
Dashboard: /proxy/45726/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.102:43106,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-kt8fdzoa,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-kt8fdzoa

0,1
Comm: tcp://172.22.178.103:41246,Total threads: 1
Dashboard: /proxy/45994/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.103:33748,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-k7vfm7_a,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-k7vfm7_a

0,1
Comm: tcp://172.22.178.103:35684,Total threads: 1
Dashboard: /proxy/44807/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.103:43883,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-vvxejn8n,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-vvxejn8n

0,1
Comm: tcp://172.22.178.79:46365,Total threads: 1
Dashboard: /proxy/32993/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.79:45599,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-lje5q2y5,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-lje5q2y5

0,1
Comm: tcp://172.22.178.79:43025,Total threads: 1
Dashboard: /proxy/34719/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.79:33067,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-og4vt5iy,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-og4vt5iy

0,1
Comm: tcp://172.22.178.62:43390,Total threads: 1
Dashboard: /proxy/39965/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.62:45801,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-73xm8stq,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-73xm8stq

0,1
Comm: tcp://172.22.178.62:34723,Total threads: 1
Dashboard: /proxy/36342/status,Memory: 37.25 GiB
Nanny: tcp://172.22.178.62:32827,
Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-n6de3gq4,Local directory: /data/keeling/a/ctavila2/tmp/dask-scratch-space/worker-n6de3gq4


In [5]:
def _seasonal_yearly_mean(file_path, start_day, end_day):
    """Return per-year means over a day-of-year window for one NetCDF file.

    Days outside the inclusive ``[start_day, end_day]`` window are masked to
    NaN and therefore skipped by the mean. The file is closed before
    returning, so the result is loaded into memory first.
    """
    with xr.open_dataset(file_path) as ds:
        day_of_year = ds["time"].dt.dayofyear
        in_window = (day_of_year >= start_day) & (day_of_year <= end_day)
        # Dataset.map replaces the deprecated Dataset.apply alias.
        windowed = ds.map(lambda var: var.where(in_window))
        yearly = windowed.groupby('time.year').mean(dim='time')
        # Materialise everything (including coordinates) before the handle closes.
        return yearly.load()


def model_yearly_averages(model, start_day, end_day, lon_max, lon_min, lat_max, lat_min):
    """Compute regional, seasonal yearly means for one model and save them.

    Reads the model's daily FWI files (historical 1975-2004 in five-year
    files, the single-year 2005 file, then RCP8.5 five-year files starting
    2006 through 2056), averages each year over the day-of-year window,
    averages over the lon/lat box, and writes one value per year to NetCDF.

    Parameters
    ----------
    model : str
        Model name as it appears in the input file names.
    start_day, end_day : int
        Inclusive day-of-year bounds of the averaging window.
    lon_max, lon_min : float
        Inclusive longitude bounds, compared after longitudes above 180 have
        been shifted down by 360.
    lat_max, lat_min : float
        Inclusive latitude bounds.

    Returns
    -------
    None
        The result is written to disk and a progress line is printed.
    """
    base_path_H = "/data/keeling/a/davidcl2/d/MACA/FWI_RHmin/historical/out/comp/macav2metdata_fwi_" + model + "_r1i1p1_historical_"
    base_path_85 = "/data/keeling/a/davidcl2/d/MACA/FWI_RHmin/rcp85/out/macav2metdata_fwi_" + model + "_r1i1p1_rcp85_"

    # Historical five-year files: 1975_1979 ... 2000_2004.
    file_paths = [
        f"{base_path_H}{year}_{year + 4}_CONUS_daily.nc"
        for year in range(1975, 2004, 5)
    ]
    # The last historical year is stored in its own single-year file.
    file_paths.append(f"{base_path_H}2005_2005_CONUS_daily.nc")
    # RCP8.5 five-year files: 2006_2010 ... 2056_2060.
    file_paths.extend(
        f"{base_path_85}{year}_{year + 4}_CONUS_daily.nc"
        for year in range(2006, 2060, 5)
    )

    # Each file is opened, reduced, and closed in turn so no handles stay open.
    datasets = [_seasonal_yearly_mean(path, start_day, end_day) for path in file_paths]

    concatenated_ds = xr.concat(datasets, dim='year')
    # Drop years that are entirely NaN after the day-of-year mask.
    selected_ds = concatenated_ds.dropna(dim='year', how='all')

    # Shift longitudes above 180 down by 360 so they compare against negative
    # lon_min/lon_max, then restore ascending order.
    wrapped_lon = np.where(selected_ds["lon"] > 180, selected_ds["lon"] - 360, selected_ds["lon"])
    selected_ds = selected_ds.assign_coords(lon=("lon", wrapped_lon)).sortby("lon")

    inside_box = (
        (selected_ds.lon >= lon_min)
        & (selected_ds.lon <= lon_max)
        & (selected_ds.lat >= lat_min)
        & (selected_ds.lat <= lat_max)
    )
    annual_mean_boundaries = selected_ds.where(inside_box, drop=True)
    # NOTE(review): averaging lat first and lon second is an unweighted mean of
    # column means; with NaN cells this differs from a single mean over both
    # dimensions, and no area weighting is applied. Kept as-is so results match.
    annual_mean_boundaries = annual_mean_boundaries.mean(dim=['lat'])
    annual_mean_boundaries = annual_mean_boundaries.mean(dim=['lon'])

    # NOTE(review): the file name says 1979_2022 although the inputs span
    # 1975-2060; left unchanged in case downstream code relies on this path.
    output_path = "/data/keeling/a/ctavila2/7_bootstrapping/models_yearly_points/macav2metdata_fwi_" + model + "_r1i1p1_rcp8.5_tmaxrhmin_1979_2022_CONUS_yearly_points.nc"

    # Save the dataset to a .nc file
    annual_mean_boundaries.to_netcdf(output_path)

    print("iteration " + model)
    


In [6]:
# Build one lazy task per entry in `models`; nothing runs until dask.compute is called.
# Window: day-of-year 152 through 304, averaged over the lon/lat box given below.
delayed = [
    dask.delayed(model_yearly_averages)(
        model=model_name,
        start_day=152,
        end_day=304,
        lon_max=-114.016667,
        lon_min=-124.766667,
        lat_max=50,
        lat_min=32.025,
    )
    for model_name in models
]



In [11]:
# Execute every queued per-model task and block until all have finished.
# No scheduler is named here; presumably the Client created in an earlier cell
# is picked up as the default scheduler — confirm on the dashboard.
results = dask.compute(*delayed)