# Generate qsub scripts for STEP00 operations

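This notebook generates PBS job scripts for the STEP00 gather operations and, for each dataset (wxformer, IFS, ERA5), a bash script that submits all of that dataset's jobs with `qsub`. The generated scripts target the NSF NCAR data analysis server, `casper.ucar.edu`.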

In [1]:
import os
import yaml
import numpy as np

In [2]:
# Absolute path of the verification config; a relative name is resolved
# against the current working directory.
config_name = os.path.realpath('verif_config.yml')

# Parse the YAML once; later cells read conf['qsub'][...] from it.
with open(config_name) as config_file:
    conf = yaml.safe_load(config_file)

## Gather wxformer (Large)

In [3]:
# Chunk boundaries for the wxformer gather jobs: steps of 5 starting at 1544.
# The arange stop of WX_LAST + 5 makes the grid run one step past WX_LAST
# (to 2194), so the boundaries are clamped to end exactly at WX_LAST.
WX_LAST = 2192
INDs = np.minimum(np.arange(1544, WX_LAST + 5, 5), WX_LAST)

In [5]:
# Write one PBS job script per consecutive pair of boundaries in INDs, then a
# bash script that submits every generated job with qsub.
qsub_dir = conf['qsub']['qsub_loc']        # where the .sh files are written
scripts_dir = conf['qsub']['scripts_loc']  # directory the job cd's into

# Placeholders, in order: working directory, start index, end index.
# NOTE(review): every job uses the same -o/-e file names; confirm whether
# per-job log files are wanted.
pbs_template = '''#!/bin/bash -l

#PBS -N gather_WX
#PBS -A NAML0001
#PBS -l walltime=23:59:59
#PBS -l select=1:ncpus=4:mem=64GB
#PBS -q casper
#PBS -o gather_WX.log
#PBS -e gather_WX.err

conda activate credit
cd {}
python STEP00_gather_wxformer.py {} {}
'''

job_files = []
for i, (ind_start, ind_end) in enumerate(zip(INDs[:-1], INDs[1:])):
    job_file = 'gather_WX_{:03d}.sh'.format(i)

    # os.path.join works whether or not qsub_loc ends with a path separator;
    # the with-block closes the file even if formatting or writing fails.
    with open(os.path.join(qsub_dir, job_file), 'w') as f:
        print(pbs_template.format(scripts_dir, ind_start, ind_end), file=f)

    job_files.append(job_file)

# The submit-all script refers to the job scripts by bare file name, so it is
# meant to be run from the directory that contains them.
with open(os.path.join(qsub_dir, 'step00_gather_WX_all.sh'), 'w') as f:
    for job_file in job_files:
        print('qsub {}'.format(job_file), file=f)

## Gather IFS

In [3]:
# Chunk boundaries for the IFS gather jobs: 1400, 1420, ..., 3700.
# The stop is pushed one step past IFS_STOP so that IFS_STOP itself is included.
IFS_START, IFS_STOP, IFS_STEP = 1400, 3700, 20
INDs = np.arange(IFS_START, IFS_STOP + IFS_STEP, IFS_STEP)

In [4]:
# Write one PBS job script per consecutive pair of boundaries in INDs, then a
# bash script that submits every generated job with qsub.
qsub_dir = conf['qsub']['qsub_loc']        # where the .sh files are written
scripts_dir = conf['qsub']['scripts_loc']  # directory the job cd's into

# Placeholders, in order: working directory, start index, end index.
# NOTE(review): every job uses the same -o/-e file names; confirm whether
# per-job log files are wanted.
pbs_template = '''#!/bin/bash -l

#PBS -N IFS
#PBS -A NAML0001
#PBS -l walltime=23:59:59
#PBS -l select=1:ncpus=4:mem=64GB
#PBS -q casper
#PBS -o gather_IFS.log
#PBS -e gather_IFS.err

conda activate credit
cd {}
python STEP00_gather_IFS.py {} {}
'''

job_files = []
for i, (ind_start, ind_end) in enumerate(zip(INDs[:-1], INDs[1:])):
    job_file = 'gather_IFS_{:03d}.sh'.format(i)

    # os.path.join works whether or not qsub_loc ends with a path separator;
    # the with-block closes the file even if formatting or writing fails.
    with open(os.path.join(qsub_dir, job_file), 'w') as f:
        print(pbs_template.format(scripts_dir, ind_start, ind_end), file=f)

    job_files.append(job_file)

# The submit-all script refers to the job scripts by bare file name, so it is
# meant to be run from the directory that contains them.
with open(os.path.join(qsub_dir, 'step00_gather_IFS_all.sh'), 'w') as f:
    for job_file in job_files:
        print('qsub {}'.format(job_file), file=f)

## Gather ERA5 (x)

In [5]:
# Chunk boundaries for the ERA5 gather jobs, in steps of 100 from 86200.
# NOTE(review): 93544 is not on the 100-step grid, so the last boundary is
# 93600 (> 93544) and is not clamped here, unlike the wxformer section, which
# overwrites its last boundary. Confirm that STEP00_gather_ERA5.py tolerates
# an end index past 93544.
ERA5_START, ERA5_STOP, ERA5_STEP = 86200, 93544, 100
INDs = np.arange(ERA5_START, ERA5_STOP + ERA5_STEP, ERA5_STEP)

In [7]:
# Write one PBS job script per consecutive pair of boundaries in INDs, then a
# bash script that submits every generated job with qsub.
qsub_dir = conf['qsub']['qsub_loc']        # where the .sh files are written
scripts_dir = conf['qsub']['scripts_loc']  # directory the job cd's into

# Placeholders, in order: working directory, start index, end index.
# NOTE(review): every job uses the same -o/-e file names; confirm whether
# per-job log files are wanted.
pbs_template = '''#!/bin/bash -l

#PBS -N ERA5
#PBS -A NAML0001
#PBS -l walltime=23:59:59
#PBS -l select=1:ncpus=4:mem=64GB
#PBS -q casper
#PBS -o gather_ERA5.log
#PBS -e gather_ERA5.err

conda activate credit
cd {}
python STEP00_gather_ERA5.py {} {}
'''

job_files = []
for i, (ind_start, ind_end) in enumerate(zip(INDs[:-1], INDs[1:])):
    job_file = 'gather_ERA5_{:03d}.sh'.format(i)

    # os.path.join works whether or not qsub_loc ends with a path separator;
    # the with-block closes the file even if formatting or writing fails.
    with open(os.path.join(qsub_dir, job_file), 'w') as f:
        print(pbs_template.format(scripts_dir, ind_start, ind_end), file=f)

    job_files.append(job_file)

# The submit-all script refers to the job scripts by bare file name, so it is
# meant to be run from the directory that contains them.
with open(os.path.join(qsub_dir, 'step00_gather_ERA5_all.sh'), 'w') as f:
    for job_file in job_files:
        print('qsub {}'.format(job_file), file=f)