-
Notifications
You must be signed in to change notification settings - Fork 0
/
cooking_medoe.yaml
90 lines (86 loc) · 2.11 KB
/
cooking_medoe.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
# Hydra defaults list: the config-group options composed into this experiment.
defaults:
  - env: cooking_base
  - agents: bp_ippo
  - run: train_10m
  - logger: default_logger
  # Select the same `env` option a second time, packaged at `eval.env`.
  - env@eval.env: ${env}
  - hydra: hydra_slurm
  # Swap the classifier option nested inside the agents/medoe group.
  - override agents/medoe/classifier: mlp_cooking
  # `_self_` comes last so that the values written in this file take
  # precedence over everything composed above.
  - _self_
# Hydra runtime settings for multirun sweeps.
# NOTE(review): launcher keys are presumably consumed by the launcher that the
# `hydra_slurm` defaults entry selects -- confirm against that config.
hydra:
  launcher:
    # 4320 minutes = 72 hours per job.
    timeout_min: 4320
    cpus_per_task: 2
    array_parallelism: 64
    mem_per_cpu: 2G
  sweep:
    # One directory per sweep launch (timestamped), one subdirectory per job
    # named after the swept values.
    dir: multirun/${name}/${now:%Y-%m-%d}/${now:%H-%M-%S}
    subdir: ${agents.medoe.zoo_alice}_${agents.medoe.zoo_bob}_${seed}_${agents.medoe.enable_medoe}_${agents.kl_coef}
  sweeper:
    params:
      # Comma-separated choices per key; `++` means "add the key, or override
      # it if it already exists". Assuming the default grid sweeper, this is
      # 4 x 4 x 2 x 2 = 64 jobs, which matches `array_parallelism` above.
      ++agents.medoe.zoo_alice: milan-everitt,lisabeth-wainwright,aja-bacon,brett-henry
      ++agents.medoe.zoo_bob: marilee-dyerson,margot-quinnell,cathrine-laing,deeanna-helm
      ++agents.medoe.enable_medoe: true,false
      ++agents.kl_coef: 0,5e-3
# Root-level values referenced by interpolations elsewhere in this file.
# `name` is used in hydra.sweep.dir.
name: 'cooking'
# `seed` is used in hydra.sweep.subdir.
seed: 1
# `zoo_path` is used by agents.zoo_path and by the classifier checkpoint path.
zoo_path: 'cooking_zoo/zoo'
# Overrides for the agents config group (base option: `bp_ippo`, see defaults).
# NOTE(review): nesting was reconstructed from the interpolation paths used in
# this file (agents.ent_coef, agents.medoe.*, agents.medoe.boost_vals.*) --
# confirm against the base `bp_ippo` config.
agents:
  zoo_path: ${zoo_path}
  model:
    # Two entries each for actor and critic; presumably layer widths.
    actor:
      - 256
      - 128
    critic:
      - 256
      - 128
  ent_coef: 8e-3
  lr:
    actor: 4e-4
    critic: 8e-4
  n_steps: 16
  n_epochs: 16
  # Group-level default is false; each agent entry below sets it to true.
  save_to_zoo: false
  n_agents: 2
  agents:
    - agent_id: alice
      save_to_zoo: true
      zoo_name: ${agents.medoe.zoo_alice}
    - agent_id: bob
      save_to_zoo: true
      zoo_name: ${agents.medoe.zoo_bob}
  exp_buffer:
    size: 0
    replacement_prob: 0
  medoe:
    # Placeholders; the sweeper params `++agents.medoe.zoo_alice` and
    # `++agents.medoe.zoo_bob` supply the real names for every job.
    zoo_alice: ZOO_ALICE
    zoo_bob: ZOO_BOB
    classifier:
      load_mode: load
      # Checkpoint file is keyed by the (alice, bob) zoo pair.
      path_to_classifier: ${zoo_path}/classifiers/${agents.medoe.zoo_alice}_${agents.medoe.zoo_bob}.pt
    enable_medoe: false
    reset_doe: false
    # base_vals are derived from boost_vals through the `eval` and `sqrt`
    # resolvers, which are not defined in this file (presumably registered by
    # the application -- TODO confirm). `agents.kl_coef` is not set in this
    # file either; the sweeper params provide it.
    base_vals:
      temp: ${eval:'1.0/${sqrt:${agents.medoe.boost_vals.temp}}'}
      ent: ${eval:'${agents.ent_coef}/${sqrt:${agents.medoe.boost_vals.ent}}'}
      kl: ${eval:'${agents.kl_coef}/${sqrt:${agents.medoe.boost_vals.kl}}'}
      clip: 1.0
    boost_vals:
      temp: 4.0
      ent: 36.0
      kl: 36.0
      clip: 1.0
# Overrides for the logger config group (base option: `default_logger`).
# NOTE(review): the source lost its indentation; placing `enable_render` and
# the three `*_period` mappings under `logger` is the most plausible reading,
# but confirm against the `default_logger` schema.
logger:
  mode: online
  enable_render: false
  project: cooking-medoe
  group: medoe
  tags:
    - AAMASCandidate
  # NOTE(review): the unit of each `val` is not defined in this file --
  # confirm against the base logger config.
  model_save_period:
    # NB model save frequency needs to be high for the forgetting results!
    val: 0.01
  eval_period:
    val: 0.02
  train_metric_period:
    val: 0.02