-
Notifications
You must be signed in to change notification settings - Fork 1
/
distrib_batch_etw.sh
63 lines (54 loc) · 2.23 KB
/
distrib_batch_etw.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#!/bin/bash
#SBATCH --job-name=navigation-analysis-habitat
#SBATCH --output=/checkpoint/%u/jobs/job.%j.out
#SBATCH --error=/checkpoint/%u/jobs/job.%j.err
#SBATCH --gpus-per-task 1
#SBATCH --nodes 1
#SBATCH --cpus-per-task 10
#SBATCH --ntasks-per-node 8
#SBATCH --mem-per-cpu=5GB
#SBATCH --partition=priority
#SBATCH --comment="iclr talk 4/8"
#SBATCH --time=72:00:00
#SBATCH --signal=USR1@300
#SBATCH --open-mode=append
#SBATCH --constraint=volta32gb
echo ${PYTHONPATH}
echo "Using setup for Erik"
. /private/home/erikwijmans/miniconda3/etc/profile.d/conda.sh
conda deactivate
conda activate nav-analysis-base
BASE_EXP_DIR="/checkpoint/erikwijmans/exp-dir"
CURRENT_DATETIME="`date +%Y_%m_%d_%H_%M_%S`";
EXP_DIR="${BASE_EXP_DIR}/exp_habitat_api_navigation_analysis_datetime_${CURRENT_DATETIME}"
mkdir -p ${EXP_DIR}
ENV_NAME="gibson-challenge-mp3d-gibson-se-neXt25-depth"
ENV_NAME="gibson-2plus-resnet50-dpfrl-depth"
# ENV_NAME="mp3d-gibson-all-loopnav-stop-grad"
# ENV_NAME="gibson-public-50-single-GPU-depth"
# ENV_NAME="gibson-2plus-se-neXt101-lstm1024-long-depth"
# ENV_NAME="mp3d-gibson-all-loopnav-noreturn-baseline-blind"
# ENV_NAME="mp3d-gibson-50-online-long-depth"
ENV_NAME="gibson-public-flee-pointnav-ftune-rgb-r${SLURM_ARRAY_TASK_ID}"
# ENV_NAME="mp3d-only-loopnav-stage-2-trained-state-blind"
# ENV_NAME="mp3d-gibson-all-pointnav-mem_${mem_len}-blind"
# ENV_NAME="mp3d-gibson-all-pointnav-no-memory-blind"
# ENV_NAME="testing"
CHECKPOINT="data/checkpoints/transfer/${ENV_NAME}"
export LD_LIBRARY_PATH=/usr/lib/x86_64-linux-gnu/nvidia-opengl:${LD_LIBRARY_PATH}
export GLOG_minloglevel=3
export MAGNUM_LOG=quiet
export MASTER_ADDR=$(srun --ntasks=1 hostname 2>&1 | tail -n1)
printenv | grep SLURM
set -x
srun --kill-on-bad-exit=1 \
python -u -m nav_analysis.train_ppo_distrib \
--extra-confs \
nav_analysis/configs/experiments/pointnav-rgb/se-resneXt50-rgb.yaml \
nav_analysis/configs/experiments/transfer/flee_scratch.yaml \
nav_analysis/configs/experiments/transfer/use_gibson_2plus_se_resneXt50_rgb_weights.yaml \
nav_analysis/configs/experiments/transfer/use_policy_weights.yaml \
--opts \
"logging.log_file=${EXP_DIR}/log.txt" \
"logging.checkpoint_folder=${CHECKPOINT}" \
"logging.tensorboard_dir=runs/${ENV_NAME}"