File tree Expand file tree Collapse file tree 12 files changed +53
-107
lines changed
Expand file tree Collapse file tree 12 files changed +53
-107
lines changed Load Diff This file was deleted.
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2- ALGOS=" ppo"
1+ ALGO=" ppo"
32ENVS=" PongNoFrameskip-v4 BreakoutNoFrameskip-v4"
43BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
5- train_loop $ALGOS " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+ bash benchmarks/ train_loop.sh -a $ALGO -e " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2- ALGOS=" ppo"
1+ ALGO=" ppo"
32ENVS=" SpaceInvadersNoFrameskip-v4 QbertNoFrameskip-v4"
43BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
5- train_loop $ALGOS " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+ bash benchmarks/ train_loop.sh -a $ALGO -e " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2- ALGOS=" ppo"
1+ ALGO=" ppo"
32ENVS=" CartPole-v1 MountainCar-v0 MountainCarContinuous-v0 Acrobot-v1 LunarLander-v2"
43BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
5- train_loop $ALGOS " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+ bash benchmarks/ train_loop.sh -a $ALGO -e " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2- ALGOS=" ppo"
1+ ALGO=" ppo"
32ENVS=" CarRacing-v0"
43BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
5- train_loop $ALGOS " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+ bash benchmarks/ train_loop.sh -a $ALGO -e " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2- ALGOS=" ppo"
1+ ALGO=" ppo"
32ENVS=" HalfCheetahBulletEnv-v0 AntBulletEnv-v0 HopperBulletEnv-v0 Walker2DBulletEnv-v0"
43BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
5- train_loop $ALGOS " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+ bash benchmarks/ train_loop.sh -a $ALGO -e " $ENVS " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- train_loop () {
2- local WANDB_TAGS=" benchmark_$( git rev-parse --short HEAD) host_$( hostname) "
3- local algo
4- local env
5- local seed
6- local WANDB_PROJECT_NAME=" ${WANDB_PROJECT_NAME:- rl-algo-impls-benchmarks} "
7- local SEEDS=" ${SEEDS:- 1 2 3} "
8- for algo in $( echo $1 ) ; do
9- for env in $( echo $2 ) ; do
10- for seed in $SEEDS ; do
11- echo python train.py --algo $algo --env $env --seed $seed --pool-size 1 --wandb-tags $WANDB_TAGS --wandb-project-name $WANDB_PROJECT_NAME
12- done
13- done
1+ while getopts a:e:s:p: flag
2+ do
3+ case " ${flag} " in
4+ a) algo=${OPTARG} ;;
5+ e) envs=${OPTARG} ;;
6+ s) seeds=${OPTARG} ;;
7+ p) project_name=${OPTARG} ;;
8+ esac
9+ done
10+
11+ WANDB_TAGS=" benchmark_$( git rev-parse --short HEAD) host_$( hostname) "
12+ project_name=" ${project_name:- rl-algo-impls-benchmarks} "
13+ seeds=" ${seeds:- 1 2 3} "
14+ for env in $( echo $envs ) ; do
15+ for seed in $seeds ; do
16+ echo python train.py --algo $algo --env $env --seed $seed --pool-size 1 --wandb-tags $WANDB_TAGS --wandb-project-name $project_name
1417 done
15- }
18+ done
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
1+ while getopts a:j:s: flag
2+ do
3+ case " ${flag} " in
4+ a) algo=${OPTARG} ;;
5+ j) n_jobs=${OPTARG} ;;
6+ p) project_name=${OPTARG} ;;
7+ s) seeds=${OPTARG} ;;
8+ esac
9+ done
210
3- # export WANDB_PROJECT_NAME="rl-algo-impls"
11+ n_jobs=" ${n_jobs:- 6} "
12+ project_name=" ${project_name:- rl-algo-impls-benchmarks} "
13+ seeds=" ${seeds:- 1 2 3} "
414
5- BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 6} "
6-
7- ALGOS=(
8- # "vpg"
9- # "dqn"
10- " ppo"
11- # "a2c"
12- )
1315ENVS=(
1416 # Basic
1517 " CartPole-v1"
3133 " SpaceInvadersNoFrameskip-v4"
3234 " QbertNoFrameskip-v4"
3335)
34- train_loop " ${ALGOS [*]} " " ${ENVS[*]} " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
36+ bash benchmarks/ train_loop.sh -a $algo -e " ${ENVS [*]} " -p $project_name -s " $seeds " | xargs -I CMD -P $n_jobs bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2-
3- # export WANDB_PROJECT_NAME="rl-algo-impls"
4-
51BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 5} "
62
7- ALGOS=(
8- # "vpg"
9- # "dqn"
10- " ppo"
11- )
3+ ALGO=" ppo"
124ENVS=(
135 " impala-PongNoFrameskip-v4"
146 " impala-BreakoutNoFrameskip-v4"
157 " impala-SpaceInvadersNoFrameskip-v4"
168 " impala-QbertNoFrameskip-v4"
179 " impala-CarRacing-v0"
1810)
19- train_loop " ${ALGOS[*]} " " ${ENVS[*]} " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
11+ bash benchmarks/ train_loop.sh -a $ALGO -e " ${ENVS[*]} " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
Original file line number Diff line number Diff line change 1- source benchmarks/train_loop.sh
2-
3- # export WANDB_PROJECT_NAME="rl-algo-impls"
4-
51BENCHMARK_MAX_PROCS=" ${BENCHMARK_MAX_PROCS:- 3} "
62
7- ALGOS=(
8- # "vpg"
9- # "dqn"
10- " ppo"
11- )
3+ ALGO=" ppo"
124ENVS=(
135 " procgen-coinrun-easy"
146 " procgen-starpilot-easy"
157 " procgen-bossfight-easy"
168 " procgen-bigfish-easy"
179)
18- train_loop " ${ALGOS[*]} " " ${ENVS[*]} " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
10+ bash benchmarks/ train_loop.sh -a $ALGO -e " ${ENVS[*]} " | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
You can’t perform that action at this time.
0 commit comments