In [3]:
import xarray as xr
import numpy as np
import matplotlib.pyplot as plt
from math import nan
import glob
import dask
import datetime
from dateutil.relativedelta import relativedelta
from functools import partial
import pandas as pd
import sys

from smyleutils import filter_utils as filt
from CASutils import readdata_utils as read

# Turn on dask's `array.slicing.split_large_chunks` option for this session.
dask.config.set({'array.slicing.split_large_chunks': True})

<dask.config.set at 0x14b799ba2250>

In [4]:
# --- Hindcast configuration -------------------------------------------------
ystart, yend = 1970, 2020            # first / last initialization year of the hindcasts
nyears = yend - ystart + 1           # number of initialization years (inclusive range)
initmon = 11                         # initialization month
initmonstr = f"{initmon:02d}"        # two-digit month string used in file names
nmems = 20                           # number of hindcast members
memstr = [f"{member:03d}" for member in range(1, nmems + 1)]  # "001" ... "020"

# --- Input / output locations -----------------------------------------------
topdir = "/glade/campaign/cesm/development/espwg/SMYLE-CW3E/timeseries/daily/FLUT/"
expname = "b.e21.BSMYLE-CW3E"
outpath = "/glade/campaign/cgd/cas/islas/python/smyle_cw3e/DATA_SORT/mjo_filter/"

### Set up the dask cluster

In [5]:
from dask.distributed import Client
from dask_jobqueue import PBSCluster

# Each PBS job hosts a single one-core worker process with 10GB of memory.
cluster = PBSCluster(
    # scheduler / accounting settings
    queue='casper',
    project='P04010022',
    walltime='03:00:00',
    resource_spec='select=1:ncpus=1:mem=10GB',
    # per-job worker layout
    cores=1,
    processes=1,
    memory='10GB',
    # node-local settings
    local_directory='$TMPDIR',
    interface='ext',
)

# Ask for 20 workers.
cluster.scale(20)

# Point the dashboard link at the JupyterHub proxy so it can be opened from the browser.
dask.config.set({'distributed.dashboard.link':'https://jupyterhub.hpc.ucar.edu/stable/user/{USER}/proxy/{port}/status'})

# Attach a client to the cluster; subsequent dask computations run on it.
client = Client(cluster)

Perhaps you already have a cluster running?
Hosting the HTTP server on port 44359 instead
  f"Port {expected} is already in use.\n"


In [6]:
# Display the cluster object so its dashboard link and worker summary are rendered below.
cluster

0,1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/44359/status,Workers: 20
Total threads: 20,Total memory: 186.20 GiB

0,1
Comm: tcp://128.117.208.112:46699,Workers: 14
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/44359/status,Total threads: 14
Started: Just now,Total memory: 130.34 GiB

0,1
Comm: tcp://128.117.208.83:36229,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/42381/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.83:38301,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-1l2h_z12,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-1l2h_z12

0,1
Comm: tcp://128.117.208.86:45251,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/33401/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.86:43247,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-3y36u8ro,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-3y36u8ro

0,1
Comm: tcp://128.117.208.83:36961,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/36827/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.83:35959,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-66fvp5_u,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-66fvp5_u

0,1
Comm: tcp://128.117.208.83:39819,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/33261/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.83:36277,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-gxwsld_s,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-gxwsld_s

0,1
Comm: tcp://128.117.208.91:38851,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/44225/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.91:40501,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-pudo1_gs,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-pudo1_gs

0,1
Comm: tcp://128.117.208.86:42527,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/39519/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.86:33587,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-68tm1rlq,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-68tm1rlq

0,1
Comm: tcp://128.117.208.91:39825,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/34475/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.91:39253,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-j9mnrjxm,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-j9mnrjxm

0,1
Comm: tcp://128.117.208.86:42063,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/40461/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.86:43309,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-75t5eecy,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-75t5eecy

0,1
Comm: tcp://128.117.208.86:34955,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/46657/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.86:42183,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-wd4kzmdo,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-wd4kzmdo

0,1
Comm: tcp://128.117.208.91:34845,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/36025/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.91:36469,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-r4iq50pa,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-r4iq50pa

0,1
Comm: tcp://128.117.208.91:46345,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/45719/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.91:34909,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-7n_meo_o,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-7n_meo_o

0,1
Comm: tcp://128.117.208.91:34147,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/36639/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.91:41789,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-6qt18ate,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-6qt18ate

0,1
Comm: tcp://128.117.208.86:43731,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/38001/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.86:42877,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-_n51j9h9,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-_n51j9h9

0,1
Comm: tcp://128.117.208.83:35967,Total threads: 1
Dashboard: https://jupyterhub.hpc.ucar.edu/stable/user/islas/proxy/33799/status,Memory: 9.31 GiB
Nanny: tcp://128.117.208.83:37027,
Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-7f0u9fjq,Local directory: /glade/derecho/scratch/islas/tmp/dask-worker-space/worker-7f0u9fjq


### Loop over members to calculate the MJO-filtered OLR for each year, treating each individual member like the observations.  The seasonal cycle that is removed is just the average over years for a given day.  I would normally remove some number of harmonics instead, but we only have 6 months in the L83.

In [7]:
def preprocessor(ds):
    """Put one hindcast file onto a common, 1970-based daily time axis.

    Intended to be passed as ``preprocess=`` to ``xr.open_mfdataset`` so that
    files from different initialization years share identical ``time`` values
    and can be stacked along a new dimension.

    Parameters
    ----------
    ds : xarray.Dataset
        Dataset from a single file, with ``time`` and ``lat`` coordinates.

    Returns
    -------
    xarray.Dataset
        The dataset restricted to 12Z samples and to 40S-40N, with ``time``
        replaced by consecutive daily stamps whose year is 1970 at the first
        sample (month, day and hour are taken from the first retained sample).

    Raises
    ------
    ValueError
        If the file contains no samples at hour 12.
    """
    # Project helper; presumably re-centres the CESM time stamps using
    # time_bnds -- TODO confirm against CASutils.readdata_utils.
    ds = read.fixcesmtime_daily(ds)

    # Keep only the 12Z samples. Positional selection is used rather than
    # Dataset.where(..., drop=True) because `where` broadcasts the time mask
    # onto every variable (including ones without a time dimension) and can
    # promote integer variables to float.
    noon_positions = np.flatnonzero((ds.time.dt.hour == 12).values)
    if noon_positions.size == 0:
        raise ValueError("preprocessor: no samples at hour 12 found on the time axis")
    ds = ds.isel(time=noon_positions)

    # Rebuild the time axis: same month/day/hour as the first sample, but with
    # the year forced to 1970, then one stamp per day for every sample.
    first = ds.time.isel(time=0).dt
    datestart = pd.Timestamp(year=1970,
                             month=int(first.month),
                             day=int(first.day),
                             hour=int(first.hour))
    ds['time'] = pd.date_range(start=datestart, periods=ds.time.size, freq="D")

    # Restrict to the 40S-40N band.
    ds = ds.sel(lat=slice(-40,40))
    return ds

In [11]:
# For every hindcast member: load FLUT for all initialization years, remove the
# across-year daily climatology, apply the wavenumber-frequency filter to each
# year separately, and keep the DJF standard deviation of the filtered field.
mjostdout = []
for imem, mem in enumerate(memstr, start=1):
    print(imem)

    # One file per initialization year for this member. Fail with a clear
    # message if a year is missing instead of an IndexError on an empty glob,
    # and sort so the choice is deterministic if several files match.
    files = []
    for iyear in range(ystart, yend + 1):
        pattern = topdir+expname+"*."+mem+".cam.h1.FLUT."+str(iyear)+initmonstr+"01-*.nc"
        matches = sorted(glob.glob(pattern))
        if not matches:
            raise FileNotFoundError(
                "No FLUT file found for member "+mem+", initialization "
                +str(iyear)+"-"+initmonstr+": "+pattern)
        files.append(matches[0])

    # Stack the years along a new `init_year` dimension; `preprocessor` gives
    # every file the same 1970-based time axis so they align.
    dat = xr.open_mfdataset(files, combine='nested', concat_dim=['init_year'],
                            parallel=True, data_vars=['FLUT'], coords='minimal',
                            compat='override', preprocess=preprocessor).FLUT

    # November through April only.
    dat = dat.sel(time=slice("1970-11-01","1971-04-30"))

    # Seasonal cycle = average over initialization years for each calendar day
    # (as stated in the notebook text). Averaging over `time` here would only
    # remove each year's seasonal mean and leave the seasonal cycle in the data.
    datclim = dat.mean('init_year')
    datanoms = dat - datclim

    # Filter each year on its own. The positional arguments are passed through
    # unchanged; presumably 0.15 is a taper fraction, 1-5 the zonal wavenumber
    # range and 20-100 the period range in days, with spd=1 sample per day --
    # TODO confirm against smyleutils.filter_utils.wkfilter.
    mjofilt = [
        filt.wkfilter(datanoms.isel(init_year=iyear), 0.15, 1, 5, 20, 100, spd=1)
        for iyear in range(datanoms.init_year.size)
    ]
    mjofilt = xr.concat(mjofilt, dim='init_year')

    # December-February standard deviation of the filtered OLR.
    mjofilt = mjofilt.sel(time=slice("1970-12-01","1971-02-28"))
    mjostd = mjofilt.std('time')

    mjostdout.append(mjostd)

# Stack the members along a new `M` dimension and write the result out.
mjostdout = xr.concat(mjostdout, dim='M')
mjostdout = mjostdout.rename('MJO_OLR')
mjostdout.to_netcdf(outpath+'MJOfilteredOLR_SMYLE_L32_init'+initmonstr+'.nc')

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20


In [9]:
# Inspect `dat` as left behind by the member loop (it holds the array for the
# last member processed); this cell only works after the loop cell has run.
print(dat)

<xarray.DataArray 'FLUT' (init_year: 51, time: 365, lat: 84, lon: 288)>
dask.array<concatenate, shape=(51, 365, 84, 288), dtype=float32, chunksize=(1, 365, 84, 288), chunktype=numpy.ndarray>
Coordinates:
  * lat      (lat) float64 -39.11 -38.17 -37.23 -36.28 ... 37.23 38.17 39.11
  * lon      (lon) float64 0.0 1.25 2.5 3.75 5.0 ... 355.0 356.2 357.5 358.8
  * time     (time) datetime64[ns] 1970-11-01T12:00:00 ... 1971-10-31T12:00:00
Dimensions without coordinates: init_year
Attributes:
    Sampling_Sequence:  rad_lwsw
    units:              W/m2
    long_name:          Upwelling longwave flux at top of model
    cell_methods:       time: mean
