Skip to content

Commit 3f5e668

Browse files
committed
Converted benchmarks/train_loop.sh from a sourced function into a standalone script
1 parent 1b67b52 commit 3f5e668

File tree

12 files changed

+53
-107
lines changed

12 files changed

+53
-107
lines changed

benchmarks/benchmark_test.sh

Lines changed: 0 additions & 32 deletions
This file was deleted.

benchmarks/colab_atari1.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
source benchmarks/train_loop.sh
2-
ALGOS="ppo"
1+
ALGO="ppo"
32
ENVS="PongNoFrameskip-v4 BreakoutNoFrameskip-v4"
43
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
5-
train_loop $ALGOS "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+
bash benchmarks/train_loop.sh -a $ALGO -e "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

benchmarks/colab_atari2.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
source benchmarks/train_loop.sh
2-
ALGOS="ppo"
1+
ALGO="ppo"
32
ENVS="SpaceInvadersNoFrameskip-v4 QbertNoFrameskip-v4"
43
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
5-
train_loop $ALGOS "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+
bash benchmarks/train_loop.sh -a $ALGO -e "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

benchmarks/colab_basic.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
source benchmarks/train_loop.sh
2-
ALGOS="ppo"
1+
ALGO="ppo"
32
ENVS="CartPole-v1 MountainCar-v0 MountainCarContinuous-v0 Acrobot-v1 LunarLander-v2"
43
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
5-
train_loop $ALGOS "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+
bash benchmarks/train_loop.sh -a $ALGO -e "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

benchmarks/colab_carracing.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
source benchmarks/train_loop.sh
2-
ALGOS="ppo"
1+
ALGO="ppo"
32
ENVS="CarRacing-v0"
43
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
5-
train_loop $ALGOS "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+
bash benchmarks/train_loop.sh -a $ALGO -e "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

benchmarks/colab_pybullet.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
source benchmarks/train_loop.sh
2-
ALGOS="ppo"
1+
ALGO="ppo"
32
ENVS="HalfCheetahBulletEnv-v0 AntBulletEnv-v0 HopperBulletEnv-v0 Walker2DBulletEnv-v0"
43
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
5-
train_loop $ALGOS "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
4+
bash benchmarks/train_loop.sh -a $ALGO -e "$ENVS" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

benchmarks/train_loop.sh

Lines changed: 17 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,18 @@
1-
train_loop () {
2-
local WANDB_TAGS="benchmark_$(git rev-parse --short HEAD) host_$(hostname)"
3-
local algo
4-
local env
5-
local seed
6-
local WANDB_PROJECT_NAME="${WANDB_PROJECT_NAME:-rl-algo-impls-benchmarks}"
7-
local SEEDS="${SEEDS:-1 2 3}"
8-
for algo in $(echo $1); do
9-
for env in $(echo $2); do
10-
for seed in $SEEDS; do
11-
echo python train.py --algo $algo --env $env --seed $seed --pool-size 1 --wandb-tags $WANDB_TAGS --wandb-project-name $WANDB_PROJECT_NAME
12-
done
13-
done
1+
while getopts a:e:s:p: flag
2+
do
3+
case "${flag}" in
4+
a) algo=${OPTARG};;
5+
e) envs=${OPTARG};;
6+
s) seeds=${OPTARG};;
7+
p) project_name=${OPTARG};;
8+
esac
9+
done
10+
11+
WANDB_TAGS="benchmark_$(git rev-parse --short HEAD) host_$(hostname)"
12+
project_name="${project_name:-rl-algo-impls-benchmarks}"
13+
seeds="${seeds:-1 2 3}"
14+
for env in $(echo $envs); do
15+
for seed in $seeds; do
16+
echo python train.py --algo $algo --env $env --seed $seed --pool-size 1 --wandb-tags $WANDB_TAGS --wandb-project-name $project_name
1417
done
15-
}
18+
done

lambda_labs/benchmark.sh

Lines changed: 13 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,17 @@
1-
source benchmarks/train_loop.sh
1+
while getopts a:j:s: flag
2+
do
3+
case "${flag}" in
4+
a) algo=${OPTARG};;
5+
j) n_jobs=${OPTARG};;
6+
p) project_name=${OPTARG};;
7+
s) seeds=${OPTARG};;
8+
esac
9+
done
210

3-
# export WANDB_PROJECT_NAME="rl-algo-impls"
11+
n_jobs="${n_jobs:-6}"
12+
project_name="${project_name:-rl-algo-impls-benchmarks}"
13+
seeds="${seeds:-1 2 3}"
414

5-
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-6}"
6-
7-
ALGOS=(
8-
# "vpg"
9-
# "dqn"
10-
"ppo"
11-
# "a2c"
12-
)
1315
ENVS=(
1416
# Basic
1517
"CartPole-v1"
@@ -31,4 +33,4 @@ ENVS=(
3133
"SpaceInvadersNoFrameskip-v4"
3234
"QbertNoFrameskip-v4"
3335
)
34-
train_loop "${ALGOS[*]}" "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
36+
bash benchmarks/train_loop.sh -a $algo -e "${ENVS[*]}" -p $project_name -s "$seeds" | xargs -I CMD -P $n_jobs bash -c CMD
Lines changed: 2 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,19 +1,11 @@
1-
source benchmarks/train_loop.sh
2-
3-
# export WANDB_PROJECT_NAME="rl-algo-impls"
4-
51
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-5}"
62

7-
ALGOS=(
8-
# "vpg"
9-
# "dqn"
10-
"ppo"
11-
)
3+
ALGO="ppo"
124
ENVS=(
135
"impala-PongNoFrameskip-v4"
146
"impala-BreakoutNoFrameskip-v4"
157
"impala-SpaceInvadersNoFrameskip-v4"
168
"impala-QbertNoFrameskip-v4"
179
"impala-CarRacing-v0"
1810
)
19-
train_loop "${ALGOS[*]}" "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
11+
bash benchmarks/train_loop.sh -a $ALGO -e "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

lambda_labs/procgen_benchmark.sh

Lines changed: 2 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,18 +1,10 @@
1-
source benchmarks/train_loop.sh
2-
3-
# export WANDB_PROJECT_NAME="rl-algo-impls"
4-
51
BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-3}"
62

7-
ALGOS=(
8-
# "vpg"
9-
# "dqn"
10-
"ppo"
11-
)
3+
ALGO="ppo"
124
ENVS=(
135
"procgen-coinrun-easy"
146
"procgen-starpilot-easy"
157
"procgen-bossfight-easy"
168
"procgen-bigfish-easy"
179
)
18-
train_loop "${ALGOS[*]}" "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD
10+
bash benchmarks/train_loop.sh -a $ALGO -e "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD

0 commit comments

Comments
 (0)