In [1]:
import subprocess
import shlex
import os
import glob

from subprocess import PIPE
from pathlib import Path

In [2]:
def submit_cuda_spatially_explicit(
    repeats=10, walltime=1, speciation=0.000001, sample=0.00025, memory=24,
    config='()', reporters=['Execution()', 'Biodiversity()'], output='./STDIN'
):
    """Top up a batch of CUDA SpatiallyExplicit simulations as a PBS array job.

    Logs of earlier submissions are looked up as `<output>.e<...>.<...>`.
    An empty error log counts as one finished repeat. A non-empty error log
    marks a failed repeat: it is deleted together with its sibling `.o` log so
    that the repeat is run again. Only the repeats that are still missing are
    submitted, by piping a generated job script into `$HOME/qsubbuf`.

    Args:
        repeats: Total number of successful repeats wanted for `output`.
        walltime: Walltime limit in whole hours (must be an `int`).
        speciation: Value of the simulation's `speciation` field.
        sample: Value of the simulation's `sample` field.
        memory: Memory request of each sub-job in GB.
        config: Extra fields for the `CUDA(...)` algorithm, wrapped in one
            pair of parentheses, e.g. `"(delta_t:2.0)"`.
        reporters: Iterable of reporter expressions, joined with commas.
        output: Path prefix of the PBS log files. Its last component becomes
            the job name, its parent directory the submission directory.

    Returns:
        The stripped stdout of `qsubbuf`, or `None` if enough repeats have
        already finished and nothing was submitted.

    Raises:
        subprocess.CalledProcessError: If `qsubbuf` exits with a non-zero status.
        KeyError: If the `HOME` environment variable is not set.
    """
    output = Path(output).resolve(strict=False)
    output.parent.mkdir(parents=True, exist_ok=True)

    finished = 0
    failed = []

    # Classify first and delete afterwards, so that the directory is not
    # modified while it is still being scanned.
    for error_log in glob.iglob(f"{glob.escape(str(output))}.e*.*"):
        # Only emptiness matters; looking at the size avoids decoding errors
        # on logs that contain arbitrary bytes.
        if os.path.getsize(error_log) == 0:
            finished += 1
        else:
            failed.append(error_log)

    for error_log in failed:
        # The sibling stdout log is found by swapping the last 'e' of the path
        # for an 'o' (assumes that nothing after the `.e` marker contains an
        # 'e', e.g. a numeric job id and index -- TODO confirm).
        output_log = 'o'.join(error_log.rsplit('e', 1))

        for stale_log in (output_log, error_log):
            try:
                os.unlink(stale_log)
            except FileNotFoundError:
                # Already gone, e.g. removed by hand; nothing left to clean up.
                pass

    repeats -= finished

    if repeats < 1:
        return None

    print(f"{repeats} x {output}")

    # Always submit at least two sub-jobs, even if only one repeat is missing
    # (presumably because the scheduler rejects one-element arrays -- TODO confirm).
    repeats = max(repeats, 2)

    walltime = "{:02d}".format(walltime)
    reporters = ','.join(reporters)

    # Kept separate from the `config` parameter, which is spliced into the
    # CUDA algorithm section below.
    script = fr"""
    #PBS -lselect={1}:ncpus={1}:mem={memory}gb:ngpus={1}:gpu_type=P1000
    #PBS -J 0-{repeats - 1}
    #PBS -lwalltime={walltime}:00:00
    
    echo $CUDA_VISIBLE_DEVICES
    
    nvidia-smi

    $HOME/necsim-rust/target-cuda/release/rustcoalescence simulate '(
        speciation: {speciation},
        sample: {sample},
        seed: '$(python3 -c "import random; print(random.getrandbits(64))")',

        algorithm: CUDA(
            device: {0},
            ptx_jit: true,
            {config.strip()[1:-1]}
        ),

        scenario: SpatiallyExplicit(
            habitat: "'$HOME'/necsim-rust/maps/madingley/fg0size12/habitat.tif",
            dispersal: "'$HOME'/necsim-rust/maps/madingley/fg0size12/dispersal.tif",
        ),

        reporters: [
            Plugin(
                library: "'$HOME'/necsim-rust/target-cuda/release/deps/libnecsim_plugins_common.so",
                reporters: [{reporters}],
            ),
        ],
    )'
    """

    # Submit the simulation batch. The submission directory is handed to the
    # child process via `cwd=` instead of `os.chdir`, so the notebook's own
    # working directory is never changed, not even if the submission fails.
    # The command is an argument list, so no shell-style re-splitting happens.
    submission = subprocess.run(
        [f"{os.environ['HOME']}/qsubbuf/target/release/qsubbuf", "-N", output.name],
        check=True, input=script, stdout=PIPE, universal_newlines=True,
        cwd=str(output.parent),
    )

    return submission.stdout.strip()

In [3]:
def submit_cuda_spatially_explicit_with_log(
    repeats=10, walltime=1, speciation=0.000001, sample=0.00025,
    config='()', reporters=['Execution()', 'Biodiversity()'], output='./STDIN',
    memory=24
):
    """Top up a batch of logged CUDA simulations, each followed by a replay.

    Every sub-job runs the SpatiallyExplicit CUDA simulation with an event log
    written to `$TMPDIR/event_log` and then replays that log with the replay
    build of `rustcoalescence`, using the same reporters for both steps.

    Logs of earlier submissions are looked up as `<output>.e<...>.<...>`.
    An empty error log counts as one finished repeat. A non-empty error log
    marks a failed repeat: it is deleted together with its sibling `.o` log so
    that the repeat is run again. Only the repeats that are still missing are
    submitted, by piping a generated job script into `$HOME/qsubbuf`.

    Args:
        repeats: Total number of successful repeats wanted for `output`.
        walltime: Walltime limit in whole hours (must be an `int`).
        speciation: Value of the simulation's `speciation` field.
        sample: Value of the simulation's `sample` field.
        config: Extra fields for the `CUDA(...)` algorithm, wrapped in one
            pair of parentheses, e.g. `"(delta_t:2.0)"`.
        reporters: Iterable of reporter expressions, joined with commas.
        output: Path prefix of the PBS log files. Its last component becomes
            the job name, its parent directory the submission directory.
        memory: Memory request of each sub-job in GB. Placed last so that
            existing positional calls keep their meaning.

    Returns:
        The stripped stdout of `qsubbuf`, or `None` if enough repeats have
        already finished and nothing was submitted.

    Raises:
        subprocess.CalledProcessError: If `qsubbuf` exits with a non-zero status.
        KeyError: If the `HOME` environment variable is not set.
    """
    output = Path(output).resolve(strict=False)
    output.parent.mkdir(parents=True, exist_ok=True)

    finished = 0
    failed = []

    # Classify first and delete afterwards, so that the directory is not
    # modified while it is still being scanned.
    for error_log in glob.iglob(f"{glob.escape(str(output))}.e*.*"):
        # Only emptiness matters; looking at the size avoids decoding errors
        # on logs that contain arbitrary bytes.
        if os.path.getsize(error_log) == 0:
            finished += 1
        else:
            failed.append(error_log)

    for error_log in failed:
        # The sibling stdout log is found by swapping the last 'e' of the path
        # for an 'o' (assumes that nothing after the `.e` marker contains an
        # 'e', e.g. a numeric job id and index -- TODO confirm).
        output_log = 'o'.join(error_log.rsplit('e', 1))

        for stale_log in (output_log, error_log):
            try:
                os.unlink(stale_log)
            except FileNotFoundError:
                # Already gone, e.g. removed by hand; nothing left to clean up.
                pass

    repeats -= finished

    if repeats < 1:
        return None

    print(f"{repeats} x {output}")

    # Always submit at least two sub-jobs, even if only one repeat is missing
    # (presumably because the scheduler rejects one-element arrays -- TODO confirm).
    repeats = max(repeats, 2)

    walltime = "{:02d}".format(walltime)
    reporters = ','.join(reporters)

    # Kept separate from the `config` parameter, which is spliced into the
    # CUDA algorithm section below. The string is raw so that the backslashes
    # of the sed expression reach the shell unchanged.
    script = fr"""
    #PBS -lselect={1}:ncpus={1}:mem={memory}gb:ngpus={1}:gpu_type=P1000
    #PBS -J 0-{repeats - 1}
    #PBS -lwalltime={walltime}:00:00
    
    echo $CUDA_VISIBLE_DEVICES
    
    nvidia-smi

    $HOME/necsim-rust/target-cuda/release/rustcoalescence simulate '(
        speciation: {speciation},
        sample: {sample},
        seed: '$(python3 -c "import random; print(random.getrandbits(64))")',

        algorithm: CUDA(
            device: {0},
            ptx_jit: true,
            {config.strip()[1:-1]}
        ),

        scenario: SpatiallyExplicit(
            habitat: "'$HOME'/necsim-rust/maps/madingley/fg0size12/habitat.tif",
            dispersal: "'$HOME'/necsim-rust/maps/madingley/fg0size12/dispersal.tif",
        ),
        
        log: "'$TMPDIR'/event_log",

        reporters: [
            Plugin(
                library: "'$HOME'/necsim-rust/target-cuda/release/deps/libnecsim_plugins_common.so",
                reporters: [{reporters}],
            ),
        ],
    )'
    
    $HOME/necsim-rust/target-replay/release/rustcoalescence replay '(
        logs: [
            "'$(echo $TMPDIR | sed "s:\[\([0-9]\+\)\]:\[\[\]\1\[\]\]:g")'/event_log/*/*"
        ],

        reporters: [
            Plugin(
                library: "'$HOME'/necsim-rust/target-replay/release/deps/libnecsim_plugins_common.so",
                reporters: [{reporters}],
            ),
        ],
    )'
    """

    # Submit the simulation batch. The submission directory is handed to the
    # child process via `cwd=` instead of `os.chdir`, so the notebook's own
    # working directory is never changed, not even if the submission fails.
    # The command is an argument list, so no shell-style re-splitting happens.
    submission = subprocess.run(
        [f"{os.environ['HOME']}/qsubbuf/target/release/qsubbuf", "-N", output.name],
        check=True, input=script, stdout=PIPE, universal_newlines=True,
        cwd=str(output.parent),
    )

    return submission.stdout.strip()

In [4]:
# Sweep the CUDA `delta_t` setting: 10 repeats per value, 6 hours of walltime each.
for delta_t in (
    0.1, 0.5, 1.0, 1.5, 2.0, 2.5, 3.0, 3.5, 3.75, 4.0, 4.25,
    4.5, 5.0, 5.5, 6.0, 7.0, 8.0, 10.0, 12.0, 16.0, 20.0,
):
    submit_cuda_spatially_explicit(
        repeats=10,
        walltime=6,
        speciation=0.000001,
        sample=0.00025,
        config=f"(delta_t:{delta_t})",
        output=f"delta-t/pbs.{delta_t}",
    )

In [5]:
# Sweep the Monolithic `event_slice` size; each size is paired with the
# memory request (in GB) used for its jobs.
for event_slice, memory in (
    (1000000, 16),
    (1778279, 16),
    (3162278, 16),
    (10000000, 16),
    (17782794, 16),
    (31622777, 16),
    (100000000, 16),
    (177827941, 24),
    (316227766, 36),
    (1000000000, 96),
):
    submit_cuda_spatially_explicit(
        repeats=10,
        walltime=6,
        speciation=0.000001,
        sample=0.00025,
        memory=memory,
        reporters=['Execution()', 'Biodiversity()', 'Counter()'],
        config=f"(parallelism_mode:Monolithic(event_slice:{event_slice}))",
        output=f"event-slice/pbs.{event_slice}",
    )

In [6]:
# Sweep the Monolithic `event_slice` size for the live-reporting runs
# (logs go to `event-slice-live/`): 10 repeats, 2 hours of walltime each.
for event_slice in (
    1000, 1778, 3162, 10000, 17783, 31623, 100000,
    177828, 316228, 1000000, 1778279, 3162278, 10000000,
):
    submit_cuda_spatially_explicit(
        repeats=10,
        walltime=2,
        speciation=0.0001,
        sample=0.0000025,
        reporters=['Execution()', 'Biodiversity()', 'Counter()'],
        config=f"(parallelism_mode:Monolithic(event_slice:{event_slice}))",
        output=f"event-slice-live/pbs.{event_slice}",
    )

In [7]:
# Same `event_slice` sweep as the live runs, but through the submission helper
# that writes an event log and replays it (logs go to `event-slice-log/`).
for event_slice in (
    1000, 1778, 3162, 10000, 17783, 31623, 100000,
    177828, 316228, 1000000, 1778279, 3162278, 10000000,
):
    submit_cuda_spatially_explicit_with_log(
        repeats=10,
        walltime=2,
        speciation=0.0001,
        sample=0.0000025,
        reporters=['Execution()', 'Biodiversity()', 'Counter()'],
        config=f"(parallelism_mode:Monolithic(event_slice:{event_slice}))",
        output=f"event-slice-log/pbs.{event_slice}",
    )

In [8]:
# Sweep the capacity of the `Absolute` dedup cache: 10 repeats per capacity,
# 6 hours of walltime each.
for dedup_capacity in (
    1000, 3162, 10000, 31623, 100000, 316228, 1000000, 3162278, 10000000,
):
    submit_cuda_spatially_explicit(
        repeats=10,
        walltime=6,
        speciation=0.000001,
        sample=0.00025,
        config=f"(dedup_cache:Absolute(capacity:{dedup_capacity}))",
        output=f"dedup-capacity/pbs.{dedup_capacity}",
    )

In [9]:
# Sweep every combination of CUDA `block_size` and `grid_size`
# (block size in the outer loop): 10 repeats per pair, 6 hours of walltime each.
for block_size in (4, 16, 32, 64, 128, 256, 512, 1024):
    for grid_size in (4, 16, 64, 256, 1024):
        submit_cuda_spatially_explicit(
            repeats=10,
            walltime=6,
            speciation=0.000001,
            sample=0.00025,
            config=f"(block_size:{block_size},grid_size:{grid_size})",
            output=f"block-grid/pbs.{block_size}.{grid_size}",
        )

In [10]:
# Sweep `step_slice` for several (speciation, sample) pairs:
# 10 repeats per combination, 6 hours of walltime each.
for speciation, sample in (
    (0.000001, 0.00025),
    (1.0, 0.00025),
    (0.01, 0.000025),
    (0.0001, 0.0000025),
    (0.000001, 0.00000025),
):
    for step_slice in (10, 50, 100, 150, 200, 250, 300, 350):
        submit_cuda_spatially_explicit(
            repeats=10,
            walltime=6,
            speciation=speciation,
            sample=sample,
            config=f"(step_slice:{step_slice})",
            output=f"step-slice/pbs.{speciation}.{sample}.{step_slice}",
        )